Diff 153879

llvm/trunk/lib/Transforms/Scalar/SimpleLoopUnswitch.cpp

Show First 20 Lines • Show All 247 Lines • ▼ Show 20 Lines
///		///
/// If this routine fails to unswitch the branch it returns false.		/// If this routine fails to unswitch the branch it returns false.
///		///
/// If the branch can be unswitched, this routine splits the preheader and		/// If the branch can be unswitched, this routine splits the preheader and
/// hoists the branch above that split. Preserves loop simplified form		/// hoists the branch above that split. Preserves loop simplified form
/// (splitting the exit block as necessary). It simplifies the branch within		/// (splitting the exit block as necessary). It simplifies the branch within
/// the loop to an unconditional branch but doesn't remove it entirely. Further		/// the loop to an unconditional branch but doesn't remove it entirely. Further
/// cleanup can be done with some simplify-cfg like pass.		/// cleanup can be done with some simplify-cfg like pass.
		///
		/// If `SE` is not null, it will be updated based on the potential loop SCEVs
		/// invalidated by this.
static bool unswitchTrivialBranch(Loop &L, BranchInst &BI, DominatorTree &DT,		static bool unswitchTrivialBranch(Loop &L, BranchInst &BI, DominatorTree &DT,
LoopInfo &LI) {		LoopInfo &LI, ScalarEvolution *SE) {
assert(BI.isConditional() && "Can only unswitch a conditional branch!");		assert(BI.isConditional() && "Can only unswitch a conditional branch!");
LLVM_DEBUG(dbgs() << " Trying to unswitch branch: " << BI << "\n");		LLVM_DEBUG(dbgs() << " Trying to unswitch branch: " << BI << "\n");

// The loop invariant values that we want to unswitch.		// The loop invariant values that we want to unswitch.
TinyPtrVector<Value *> Invariants;		TinyPtrVector<Value *> Invariants;

// When true, we're fully unswitching the branch rather than just unswitching		// When true, we're fully unswitching the branch rather than just unswitching
// some input conditions to the branch.		// some input conditions to the branch.
▲ Show 20 Lines • Show All 47 Lines • ▼ Show 20 Lines	LLVM_DEBUG({
for (Value *Invariant : Invariants) {		for (Value *Invariant : Invariants) {
dbgs() << " " << *Invariant << " == true";		dbgs() << " " << *Invariant << " == true";
if (Invariant != Invariants.back())		if (Invariant != Invariants.back())
dbgs() << " \|\|";		dbgs() << " \|\|";
dbgs() << "\n";		dbgs() << "\n";
}		}
});		});

		// If we have scalar evolutions, we need to invalidate them including this
		// loop and the loop containing the exit block.
		if (SE) {
		if (Loop *ExitL = LI.getLoopFor(LoopExitBB))
		SE->forgetLoop(ExitL);
		else
		// Forget the entire nest as this exits the entire nest.
		SE->forgetTopmostLoop(&L);
		}

// Split the preheader, so that we know that there is a safe place to insert		// Split the preheader, so that we know that there is a safe place to insert
// the conditional branch. We will change the preheader to have a conditional		// the conditional branch. We will change the preheader to have a conditional
// branch on LoopCond.		// branch on LoopCond.
BasicBlock *OldPH = L.getLoopPreheader();		BasicBlock *OldPH = L.getLoopPreheader();
BasicBlock *NewPH = SplitEdge(OldPH, L.getHeader(), &DT, &LI);		BasicBlock *NewPH = SplitEdge(OldPH, L.getHeader(), &DT, &LI);

// Now that we have a place to insert the conditional branch, create a place		// Now that we have a place to insert the conditional branch, create a place
// to branch to: this is the exit block out of the loop that we are		// to branch to: this is the exit block out of the loop that we are
▲ Show 20 Lines • Show All 86 Lines • ▼ Show 20 Lines
/// (splitting the exit blocks as necessary). It simplifies the switch within		/// (splitting the exit blocks as necessary). It simplifies the switch within
/// the loop by removing now-dead cases. If the default case is one of those		/// the loop by removing now-dead cases. If the default case is one of those
/// unswitched, it replaces its destination with a new basic block containing		/// unswitched, it replaces its destination with a new basic block containing
/// only unreachable. Such basic blocks, while technically loop exits, are not		/// only unreachable. Such basic blocks, while technically loop exits, are not
/// considered for unswitching so this is a stable transform and the same		/// considered for unswitching so this is a stable transform and the same
/// switch will not be revisited. If after unswitching there is only a single		/// switch will not be revisited. If after unswitching there is only a single
/// in-loop successor, the switch is further simplified to an unconditional		/// in-loop successor, the switch is further simplified to an unconditional
/// branch. Still more cleanup can be done with some simplify-cfg like pass.		/// branch. Still more cleanup can be done with some simplify-cfg like pass.
		///
		/// If `SE` is not null, it will be updated based on the potential loop SCEVs
		/// invalidated by this.
static bool unswitchTrivialSwitch(Loop &L, SwitchInst &SI, DominatorTree &DT,		static bool unswitchTrivialSwitch(Loop &L, SwitchInst &SI, DominatorTree &DT,
LoopInfo &LI) {		LoopInfo &LI, ScalarEvolution *SE) {
LLVM_DEBUG(dbgs() << " Trying to unswitch switch: " << SI << "\n");		LLVM_DEBUG(dbgs() << " Trying to unswitch switch: " << SI << "\n");
Value *LoopCond = SI.getCondition();		Value *LoopCond = SI.getCondition();

// If this isn't switching on an invariant condition, we can't unswitch it.		// If this isn't switching on an invariant condition, we can't unswitch it.
if (!L.isLoopInvariant(LoopCond))		if (!L.isLoopInvariant(LoopCond))
return false;		return false;

auto *ParentBB = SI.getParent();		auto *ParentBB = SI.getParent();
Show All 10 Lines	if (!L.contains(SI.getDefaultDest()) &&
areLoopExitPHIsLoopInvariant(L, ParentBB, SI.getDefaultDest()) &&		areLoopExitPHIsLoopInvariant(L, ParentBB, SI.getDefaultDest()) &&
!isa<UnreachableInst>(SI.getDefaultDest()->getTerminator()))		!isa<UnreachableInst>(SI.getDefaultDest()->getTerminator()))
DefaultExitBB = SI.getDefaultDest();		DefaultExitBB = SI.getDefaultDest();
else if (ExitCaseIndices.empty())		else if (ExitCaseIndices.empty())
return false;		return false;

LLVM_DEBUG(dbgs() << " unswitching trivial cases...\n");		LLVM_DEBUG(dbgs() << " unswitching trivial cases...\n");

		// We may need to invalidate SCEVs for the outermost loop reached by any of
		// the exits.
		Loop *OuterL = &L;

SmallVector<std::pair<ConstantInt , BasicBlock >, 4> ExitCases;		SmallVector<std::pair<ConstantInt , BasicBlock >, 4> ExitCases;
ExitCases.reserve(ExitCaseIndices.size());		ExitCases.reserve(ExitCaseIndices.size());
// We walk the case indices backwards so that we remove the last case first		// We walk the case indices backwards so that we remove the last case first
// and don't disrupt the earlier indices.		// and don't disrupt the earlier indices.
for (unsigned Index : reverse(ExitCaseIndices)) {		for (unsigned Index : reverse(ExitCaseIndices)) {
auto CaseI = SI.case_begin() + Index;		auto CaseI = SI.case_begin() + Index;
		// Compute the outer loop from this exit.
		Loop *ExitL = LI.getLoopFor(CaseI->getCaseSuccessor());
		if (!ExitL \|\| ExitL->contains(OuterL))
		OuterL = ExitL;
// Save the value of this case.		// Save the value of this case.
ExitCases.push_back({CaseI->getCaseValue(), CaseI->getCaseSuccessor()});		ExitCases.push_back({CaseI->getCaseValue(), CaseI->getCaseSuccessor()});
// Delete the unswitched cases.		// Delete the unswitched cases.
SI.removeCase(CaseI);		SI.removeCase(CaseI);
}		}

		if (SE) {
		if (OuterL)
		SE->forgetLoop(OuterL);
		else
		SE->forgetTopmostLoop(&L);
		}

// Check if after this all of the remaining cases point at the same		// Check if after this all of the remaining cases point at the same
// successor.		// successor.
BasicBlock *CommonSuccBB = nullptr;		BasicBlock *CommonSuccBB = nullptr;
if (SI.getNumCases() > 0 &&		if (SI.getNumCases() > 0 &&
std::all_of(std::next(SI.case_begin()), SI.case_end(),		std::all_of(std::next(SI.case_begin()), SI.case_end(),
[&SI](const SwitchInst::CaseHandle &Case) {		[&SI](const SwitchInst::CaseHandle &Case) {
return Case.getCaseSuccessor() ==		return Case.getCaseSuccessor() ==
SI.case_begin()->getCaseSuccessor();		SI.case_begin()->getCaseSuccessor();
▲ Show 20 Lines • Show All 141 Lines • ▼ Show 20 Lines
/// any side effects occur. These can potentially be unswitched without		/// any side effects occur. These can potentially be unswitched without
/// duplicating the loop. If a branch or switch is successfully unswitched the		/// duplicating the loop. If a branch or switch is successfully unswitched the
/// scanning continues to see if subsequent branches or switches have become		/// scanning continues to see if subsequent branches or switches have become
/// trivial. Once all trivial candidates have been unswitched, this routine		/// trivial. Once all trivial candidates have been unswitched, this routine
/// returns.		/// returns.
///		///
/// The return value indicates whether anything was unswitched (and therefore		/// The return value indicates whether anything was unswitched (and therefore
/// changed).		/// changed).
		///
		/// If `SE` is not null, it will be updated based on the potential loop SCEVs
		/// invalidated by this.
static bool unswitchAllTrivialConditions(Loop &L, DominatorTree &DT,		static bool unswitchAllTrivialConditions(Loop &L, DominatorTree &DT,
LoopInfo &LI) {		LoopInfo &LI, ScalarEvolution *SE) {
bool Changed = false;		bool Changed = false;

// If loop header has only one reachable successor we should keep looking for		// If loop header has only one reachable successor we should keep looking for
// trivial condition candidates in the successor as well. An alternative is		// trivial condition candidates in the successor as well. An alternative is
// to constant fold conditions and merge successors into loop header (then we		// to constant fold conditions and merge successors into loop header (then we
// only need to check header's terminator). The reason for not doing this in		// only need to check header's terminator). The reason for not doing this in
// LoopUnswitch pass is that it could potentially break LoopPassManager's		// LoopUnswitch pass is that it could potentially break LoopPassManager's
// invariants. Folding dead branches could either eliminate the current loop		// invariants. Folding dead branches could either eliminate the current loop
Show All 17 Lines	do {

if (auto *SI = dyn_cast<SwitchInst>(CurrentTerm)) {		if (auto *SI = dyn_cast<SwitchInst>(CurrentTerm)) {
// Don't bother trying to unswitch past a switch with a constant		// Don't bother trying to unswitch past a switch with a constant
// condition. This should be removed prior to running this pass by		// condition. This should be removed prior to running this pass by
// simplify-cfg.		// simplify-cfg.
if (isa<Constant>(SI->getCondition()))		if (isa<Constant>(SI->getCondition()))
return Changed;		return Changed;

if (!unswitchTrivialSwitch(L, *SI, DT, LI))		if (!unswitchTrivialSwitch(L, *SI, DT, LI, SE))
// Couldn't unswitch this one so we're done.		// Couldn't unswitch this one so we're done.
return Changed;		return Changed;

// Mark that we managed to unswitch something.		// Mark that we managed to unswitch something.
Changed = true;		Changed = true;

// If unswitching turned the terminator into an unconditional branch then		// If unswitching turned the terminator into an unconditional branch then
// we can continue. The unswitching logic specifically works to fold any		// we can continue. The unswitching logic specifically works to fold any
Show All 15 Lines	do {
// Don't bother trying to unswitch past an unconditional branch or a branch		// Don't bother trying to unswitch past an unconditional branch or a branch
// with a constant value. These should be removed by simplify-cfg prior to		// with a constant value. These should be removed by simplify-cfg prior to
// running this pass.		// running this pass.
if (!BI->isConditional() \|\| isa<Constant>(BI->getCondition()))		if (!BI->isConditional() \|\| isa<Constant>(BI->getCondition()))
return Changed;		return Changed;

// Found a trivial condition candidate: non-foldable conditional branch. If		// Found a trivial condition candidate: non-foldable conditional branch. If
// we fail to unswitch this, we can't do anything else that is trivial.		// we fail to unswitch this, we can't do anything else that is trivial.
if (!unswitchTrivialBranch(L, *BI, DT, LI))		if (!unswitchTrivialBranch(L, *BI, DT, LI, SE))
return Changed;		return Changed;

// Mark that we managed to unswitch something.		// Mark that we managed to unswitch something.
Changed = true;		Changed = true;

// If we only unswitched some of the conditions feeding the branch, we won't		// If we only unswitched some of the conditions feeding the branch, we won't
// have collapsed it to a single successor.		// have collapsed it to a single successor.
BI = cast<BranchInst>(CurrentBB->getTerminator());		BI = cast<BranchInst>(CurrentBB->getTerminator());
▲ Show 20 Lines • Show All 921 Lines • ▼ Show 20 Lines	for (DomTreeNode ChildN : N) {
DomWorklist.push_back(ChildN);		DomWorklist.push_back(ChildN);
}		}
} while (!DomWorklist.empty());		} while (!DomWorklist.empty());
}		}

static bool unswitchNontrivialInvariants(		static bool unswitchNontrivialInvariants(
Loop &L, TerminatorInst &TI, ArrayRef<Value *> Invariants,		Loop &L, TerminatorInst &TI, ArrayRef<Value *> Invariants,
DominatorTree &DT, LoopInfo &LI, AssumptionCache &AC,		DominatorTree &DT, LoopInfo &LI, AssumptionCache &AC,
function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB) {		function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB,
		ScalarEvolution *SE) {
auto *ParentBB = TI.getParent();		auto *ParentBB = TI.getParent();
BranchInst *BI = dyn_cast<BranchInst>(&TI);		BranchInst *BI = dyn_cast<BranchInst>(&TI);
SwitchInst *SI = BI ? nullptr : cast<SwitchInst>(&TI);		SwitchInst *SI = BI ? nullptr : cast<SwitchInst>(&TI);

// We can only unswitch switches, conditional branches with an invariant		// We can only unswitch switches, conditional branches with an invariant
// condition, or combining invariant conditions with an instruction.		// condition, or combining invariant conditions with an instruction.
assert((SI \|\| BI->isConditional()) &&		assert((SI \|\| BI->isConditional()) &&
"Can only unswitch switches and conditional branch!");		"Can only unswitch switches and conditional branch!");
▲ Show 20 Lines • Show All 66 Lines • ▼ Show 20 Lines	if (!NewOuterExitL) {
// We exited the entire nest with this block, so we're done.		// We exited the entire nest with this block, so we're done.
OuterExitL = nullptr;		OuterExitL = nullptr;
break;		break;
}		}
if (NewOuterExitL != OuterExitL && NewOuterExitL->contains(OuterExitL))		if (NewOuterExitL != OuterExitL && NewOuterExitL->contains(OuterExitL))
OuterExitL = NewOuterExitL;		OuterExitL = NewOuterExitL;
}		}

		// At this point, we're definitely going to unswitch something so invalidate
		// any cached information in ScalarEvolution for the outermost loop
		// containing an exit block and all nested loops.
		if (SE) {
		if (OuterExitL)
		SE->forgetLoop(OuterExitL);
		else
		SE->forgetTopmostLoop(&L);
		}

// If the edge from this terminator to a successor dominates that successor,		// If the edge from this terminator to a successor dominates that successor,
// store a map from each block in its dominator subtree to it. This lets us		// store a map from each block in its dominator subtree to it. This lets us
// tell when cloning for a particular successor if a block is dominated by		// tell when cloning for a particular successor if a block is dominated by
// some other successor with a single data structure. We use this to		// some other successor with a single data structure. We use this to
// significantly reduce cloning.		// significantly reduce cloning.
SmallDenseMap<BasicBlock , BasicBlock , 16> DominatingSucc;		SmallDenseMap<BasicBlock , BasicBlock , 16> DominatingSucc;
for (auto SuccBB : llvm::concat<BasicBlock const>(		for (auto SuccBB : llvm::concat<BasicBlock const>(
makeArrayRef(RetainedSuccBB), UnswitchedSuccBBs))		makeArrayRef(RetainedSuccBB), UnswitchedSuccBBs))
▲ Show 20 Lines • Show All 247 Lines • ▼ Show 20 Lines	int Cost = std::accumulate(
return Sum + computeDomSubtreeCost(*ChildN, BBCostMap, DTCostMap);		return Sum + computeDomSubtreeCost(*ChildN, BBCostMap, DTCostMap);
});		});
bool Inserted = DTCostMap.insert({&N, Cost}).second;		bool Inserted = DTCostMap.insert({&N, Cost}).second;
(void)Inserted;		(void)Inserted;
assert(Inserted && "Should not insert a node while visiting children!");		assert(Inserted && "Should not insert a node while visiting children!");
return Cost;		return Cost;
}		}

static bool unswitchBestCondition(		static bool
Loop &L, DominatorTree &DT, LoopInfo &LI, AssumptionCache &AC,		unswitchBestCondition(Loop &L, DominatorTree &DT, LoopInfo &LI,
TargetTransformInfo &TTI,		AssumptionCache &AC, TargetTransformInfo &TTI,
function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB) {		function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB,
		ScalarEvolution *SE) {
// Collect all invariant conditions within this loop (as opposed to an inner		// Collect all invariant conditions within this loop (as opposed to an inner
// loop which would be handled when visiting that inner loop).		// loop which would be handled when visiting that inner loop).
SmallVector<std::pair<TerminatorInst , TinyPtrVector<Value >>, 4>		SmallVector<std::pair<TerminatorInst , TinyPtrVector<Value >>, 4>
UnswitchCandidates;		UnswitchCandidates;
for (auto *BB : L.blocks()) {		for (auto *BB : L.blocks()) {
if (LI.getLoopFor(BB) != &L)		if (LI.getLoopFor(BB) != &L)
continue;		continue;

▲ Show 20 Lines • Show All 176 Lines • ▼ Show 20 Lines	LLVM_DEBUG(dbgs() << "Cannot unswitch, lowest cost found: "
<< BestUnswitchCost << "\n");		<< BestUnswitchCost << "\n");
return false;		return false;
}		}

LLVM_DEBUG(dbgs() << " Trying to unswitch non-trivial (cost = "		LLVM_DEBUG(dbgs() << " Trying to unswitch non-trivial (cost = "
<< BestUnswitchCost << ") terminator: " << *BestUnswitchTI		<< BestUnswitchCost << ") terminator: " << *BestUnswitchTI
<< "\n");		<< "\n");
return unswitchNontrivialInvariants(		return unswitchNontrivialInvariants(
L, *BestUnswitchTI, BestUnswitchInvariants, DT, LI, AC, UnswitchCB);		L, *BestUnswitchTI, BestUnswitchInvariants, DT, LI, AC, UnswitchCB, SE);
}		}

/// Unswitch control flow predicated on loop invariant conditions.		/// Unswitch control flow predicated on loop invariant conditions.
///		///
/// This first hoists all branches or switches which are trivial (IE, do not		/// This first hoists all branches or switches which are trivial (IE, do not
/// require duplicating any part of the loop) out of the loop body. It then		/// require duplicating any part of the loop) out of the loop body. It then
/// looks at other loop invariant control flows and tries to unswitch those as		/// looks at other loop invariant control flows and tries to unswitch those as
/// well by cloning the loop if the result is small enough.		/// well by cloning the loop if the result is small enough.
static bool		///
unswitchLoop(Loop &L, DominatorTree &DT, LoopInfo &LI, AssumptionCache &AC,		/// The `DT`, `LI`, `AC`, `TTI` parameters are required analyses that are also
TargetTransformInfo &TTI, bool NonTrivial,		/// updated based on the unswitch.
function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB) {		///
		/// If either `NonTrivial` is true or the flag `EnableNonTrivialUnswitch` is
		/// true, we will attempt to do non-trivial unswitching as well as trivial
		/// unswitching.
		///
		/// The `UnswitchCB` callback provided will be run after unswitching is
		/// complete, with the first parameter set to `true` if the provided loop
		/// remains a loop, and a list of new sibling loops created.
		///
		/// If `SE` is non-null, we will update that analysis based on the unswitching
		/// done.
		static bool unswitchLoop(Loop &L, DominatorTree &DT, LoopInfo &LI,
		AssumptionCache &AC, TargetTransformInfo &TTI,
		bool NonTrivial,
		function_ref<void(bool, ArrayRef<Loop *>)> UnswitchCB,
		ScalarEvolution *SE) {
assert(L.isRecursivelyLCSSAForm(DT, LI) &&		assert(L.isRecursivelyLCSSAForm(DT, LI) &&
"Loops must be in LCSSA form before unswitching.");		"Loops must be in LCSSA form before unswitching.");
bool Changed = false;		bool Changed = false;

// Must be in loop simplified form: we need a preheader and dedicated exits.		// Must be in loop simplified form: we need a preheader and dedicated exits.
if (!L.isLoopSimplifyForm())		if (!L.isLoopSimplifyForm())
return false;		return false;

// Try trivial unswitch first before loop over other basic blocks in the loop.		// Try trivial unswitch first before loop over other basic blocks in the loop.
if (unswitchAllTrivialConditions(L, DT, LI)) {		if (unswitchAllTrivialConditions(L, DT, LI, SE)) {
// If we unswitched successfully we will want to clean up the loop before		// If we unswitched successfully we will want to clean up the loop before
// processing it further so just mark it as unswitched and return.		// processing it further so just mark it as unswitched and return.
UnswitchCB(/CurrentLoopValid/ true, {});		UnswitchCB(/CurrentLoopValid/ true, {});
return true;		return true;
}		}

// If we're not doing non-trivial unswitching, we're done. We both accept		// If we're not doing non-trivial unswitching, we're done. We both accept
// a parameter but also check a local flag that can be used for testing		// a parameter but also check a local flag that can be used for testing
// and debugging.		// and debugging.
if (!NonTrivial && !EnableNonTrivialUnswitch)		if (!NonTrivial && !EnableNonTrivialUnswitch)
return false;		return false;

// For non-trivial unswitching, because it often creates new loops, we rely on		// For non-trivial unswitching, because it often creates new loops, we rely on
// the pass manager to iterate on the loops rather than trying to immediately		// the pass manager to iterate on the loops rather than trying to immediately
// reach a fixed point. There is no substantial advantage to iterating		// reach a fixed point. There is no substantial advantage to iterating
// internally, and if any of the new loops are simplified enough to contain		// internally, and if any of the new loops are simplified enough to contain
// trivial unswitching we want to prefer those.		// trivial unswitching we want to prefer those.

// Try to unswitch the best invariant condition. We prefer this full unswitch to		// Try to unswitch the best invariant condition. We prefer this full unswitch to
// a partial unswitch when possible below the threshold.		// a partial unswitch when possible below the threshold.
if (unswitchBestCondition(L, DT, LI, AC, TTI, UnswitchCB))		if (unswitchBestCondition(L, DT, LI, AC, TTI, UnswitchCB, SE))
return true;		return true;

// No other opportunities to unswitch.		// No other opportunities to unswitch.
return Changed;		return Changed;
}		}

PreservedAnalyses SimpleLoopUnswitchPass::run(Loop &L, LoopAnalysisManager &AM,		PreservedAnalyses SimpleLoopUnswitchPass::run(Loop &L, LoopAnalysisManager &AM,
LoopStandardAnalysisResults &AR,		LoopStandardAnalysisResults &AR,
Show All 17 Lines	auto UnswitchCB = [&L, &U, &LoopName](bool CurrentLoopValid,
// If the current loop remains valid, we should revisit it to catch any		// If the current loop remains valid, we should revisit it to catch any
// other unswitch opportunities. Otherwise, we need to mark it as deleted.		// other unswitch opportunities. Otherwise, we need to mark it as deleted.
if (CurrentLoopValid)		if (CurrentLoopValid)
U.revisitCurrentLoop();		U.revisitCurrentLoop();
else		else
U.markLoopAsDeleted(L, LoopName);		U.markLoopAsDeleted(L, LoopName);
};		};

if (!unswitchLoop(L, AR.DT, AR.LI, AR.AC, AR.TTI, NonTrivial,		if (!unswitchLoop(L, AR.DT, AR.LI, AR.AC, AR.TTI, NonTrivial, UnswitchCB,
UnswitchCB))		&AR.SE))
return PreservedAnalyses::all();		return PreservedAnalyses::all();

// Historically this pass has had issues with the dominator tree so verify it		// Historically this pass has had issues with the dominator tree so verify it
// in asserts builds.		// in asserts builds.
assert(AR.DT.verify(DominatorTree::VerificationLevel::Fast));		assert(AR.DT.verify(DominatorTree::VerificationLevel::Fast));
return getLoopPassPreservedAnalyses();		return getLoopPassPreservedAnalyses();
}		}

Show All 31 Lines	bool SimpleLoopUnswitchLegacyPass::runOnLoop(Loop *L, LPPassManager &LPM) {
LLVM_DEBUG(dbgs() << "Unswitching loop in " << F.getName() << ": " << *L		LLVM_DEBUG(dbgs() << "Unswitching loop in " << F.getName() << ": " << *L
<< "\n");		<< "\n");

auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();		auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();		auto &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo();
auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);		auto &AC = getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F);
auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);		auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);

		auto *SEWP = getAnalysisIfAvailable<ScalarEvolutionWrapperPass>();
		auto *SE = SEWP ? &SEWP->getSE() : nullptr;

auto UnswitchCB = [&L, &LPM](bool CurrentLoopValid,		auto UnswitchCB = [&L, &LPM](bool CurrentLoopValid,
ArrayRef<Loop *> NewLoops) {		ArrayRef<Loop *> NewLoops) {
// If we did a non-trivial unswitch, we have added new (cloned) loops.		// If we did a non-trivial unswitch, we have added new (cloned) loops.
for (auto *NewL : NewLoops)		for (auto *NewL : NewLoops)
LPM.addLoop(*NewL);		LPM.addLoop(*NewL);

// If the current loop remains valid, re-add it to the queue. This is		// If the current loop remains valid, re-add it to the queue. This is
// a little wasteful as we'll finish processing the current loop as well,		// a little wasteful as we'll finish processing the current loop as well,
// but it is the best we can do in the old PM.		// but it is the best we can do in the old PM.
if (CurrentLoopValid)		if (CurrentLoopValid)
LPM.addLoop(*L);		LPM.addLoop(*L);
else		else
LPM.markLoopAsDeleted(*L);		LPM.markLoopAsDeleted(*L);
};		};

bool Changed =		bool Changed = unswitchLoop(*L, DT, LI, AC, TTI, NonTrivial, UnswitchCB, SE);
unswitchLoop(*L, DT, LI, AC, TTI, NonTrivial, UnswitchCB);

// If anything was unswitched, also clear any cached information about this		// If anything was unswitched, also clear any cached information about this
// loop.		// loop.
LPM.deleteSimpleAnalysisLoop(L);		LPM.deleteSimpleAnalysisLoop(L);

// Historically this pass has had issues with the dominator tree so verify it		// Historically this pass has had issues with the dominator tree so verify it
// in asserts builds.		// in asserts builds.
assert(DT.verify(DominatorTree::VerificationLevel::Fast));		assert(DT.verify(DominatorTree::VerificationLevel::Fast));
Show All 18 Lines

llvm/trunk/test/Transforms/SimpleLoopUnswitch/update-scev.ll

				; RUN: opt -passes='print<scalar-evolution>,loop(unswitch,loop-instsimplify),print<scalar-evolution>' -enable-nontrivial-unswitch -S < %s 2>%t.scev \| FileCheck %s
				; RUN: FileCheck %s --check-prefix=SCEV < %t.scev

				target triple = "x86_64-unknown-linux-gnu"

				declare void @f()

				; Check that trivially unswitching a branch in an inner loop resets both the
				; inner and outer loop trip count.
				define void @test1(i32 %n, i32 %m, i1 %cond) {
				; Check that SCEV has no trip count before unswitching.
				; SCEV-LABEL: Determining loop execution counts for: @test1
				; SCEV: Loop %inner_loop_begin: <multiple exits> Unpredictable backedge-taken count.
				; SCEV: Loop %outer_loop_begin: Unpredictable backedge-taken count.
				;
				; Now check that after unswitching and simplifying instructions we get clean
				; backedge-taken counts.
				; SCEV-LABEL: Determining loop execution counts for: @test1
				; SCEV: Loop %inner_loop_begin: backedge-taken count is (-1 + (1 smax %m))<nsw>
				; SCEV: Loop %outer_loop_begin: backedge-taken count is (-1 + (1 smax %n))<nsw>
				;
				; And verify the code matches what we expect.
				; CHECK-LABEL: define void @test1(
				entry:
				br label %outer_loop_begin
				; Ensure the outer loop didn't get unswitched.
				; CHECK: entry:
				; CHECK-NEXT: br label %outer_loop_begin

				outer_loop_begin:
				%i = phi i32 [ %i.next, %outer_loop_latch ], [ 0, %entry ]
				; Block unswitching of the outer loop with a noduplicate call.
				call void @f() noduplicate
				br label %inner_loop_begin
				; Ensure the inner loop got unswitched into the outer loop.
				; CHECK: outer_loop_begin:
				; CHECK-NEXT: %{{.*}} = phi i32
				; CHECK-NEXT: call void @f()
				; CHECK-NEXT: br i1 %cond,

				inner_loop_begin:
				%j = phi i32 [ %j.next, %inner_loop_latch ], [ 0, %outer_loop_begin ]
				br i1 %cond, label %inner_loop_latch, label %inner_loop_early_exit

				inner_loop_latch:
				%j.next = add nsw i32 %j, 1
				%j.cmp = icmp slt i32 %j.next, %m
				br i1 %j.cmp, label %inner_loop_begin, label %inner_loop_late_exit

				inner_loop_early_exit:
				%j.lcssa = phi i32 [ %i, %inner_loop_begin ]
				br label %outer_loop_latch

				inner_loop_late_exit:
				br label %outer_loop_latch

				outer_loop_latch:
				%i.phi = phi i32 [ %j.lcssa, %inner_loop_early_exit ], [ %i, %inner_loop_late_exit ]
				%i.next = add nsw i32 %i.phi, 1
				%i.cmp = icmp slt i32 %i.next, %n
				br i1 %i.cmp, label %outer_loop_begin, label %exit

				exit:
				ret void
				}

				; Check that trivially unswitching a switch in an inner loop resets both the
				; inner and outer loop trip count.
				define void @test2(i32 %n, i32 %m, i32 %cond) {
				; Check that SCEV has no trip count before unswitching.
				; SCEV-LABEL: Determining loop execution counts for: @test2
				; SCEV: Loop %inner_loop_begin: <multiple exits> Unpredictable backedge-taken count.
				; SCEV: Loop %outer_loop_begin: Unpredictable backedge-taken count.
				;
				; Now check that after unswitching and simplifying instructions we get clean
				; backedge-taken counts.
				; SCEV-LABEL: Determining loop execution counts for: @test2
				; SCEV: Loop %inner_loop_begin: backedge-taken count is (-1 + (1 smax %m))<nsw>
				; FIXME: The following backedge-taken count should be known, but apparently
				; isn't, just because of a switch in the outer loop.
				; SCEV: Loop %outer_loop_begin: Unpredictable backedge-taken count.
				;
				; CHECK-LABEL: define void @test2(
				entry:
				br label %outer_loop_begin
				; Ensure the outer loop didn't get unswitched.
				; CHECK: entry:
				; CHECK-NEXT: br label %outer_loop_begin

				outer_loop_begin:
				%i = phi i32 [ %i.next, %outer_loop_latch ], [ 0, %entry ]
				; Block unswitching of the outer loop with a noduplicate call.
				call void @f() noduplicate
				br label %inner_loop_begin
				; Ensure the inner loop got unswitched into the outer loop.
				; CHECK: outer_loop_begin:
				; CHECK-NEXT: %{{.*}} = phi i32
				; CHECK-NEXT: call void @f()
				; CHECK-NEXT: switch i32 %cond,

				inner_loop_begin:
				%j = phi i32 [ %j.next, %inner_loop_latch ], [ 0, %outer_loop_begin ]
				switch i32 %cond, label %inner_loop_early_exit [
				i32 1, label %inner_loop_latch
				i32 2, label %inner_loop_latch
				]

				inner_loop_latch:
				%j.next = add nsw i32 %j, 1
				%j.cmp = icmp slt i32 %j.next, %m
				br i1 %j.cmp, label %inner_loop_begin, label %inner_loop_late_exit

				inner_loop_early_exit:
				%j.lcssa = phi i32 [ %i, %inner_loop_begin ]
				br label %outer_loop_latch

				inner_loop_late_exit:
				br label %outer_loop_latch

				outer_loop_latch:
				%i.phi = phi i32 [ %j.lcssa, %inner_loop_early_exit ], [ %i, %inner_loop_late_exit ]
				%i.next = add nsw i32 %i.phi, 1
				%i.cmp = icmp slt i32 %i.next, %n
				br i1 %i.cmp, label %outer_loop_begin, label %exit

				exit:
				ret void
				}

				; Check that non-trivial unswitching of a branch in an inner loop into the outer
				; loop invalidates both inner and outer.
				define void @test3(i32 %n, i32 %m, i1 %cond) {
				; Check that SCEV has no trip count before unswitching.
				; SCEV-LABEL: Determining loop execution counts for: @test3
				; SCEV: Loop %inner_loop_begin: <multiple exits> Unpredictable backedge-taken count.
				; SCEV: Loop %outer_loop_begin: Unpredictable backedge-taken count.
				;
				; Now check that after unswitching and simplifying instructions we get clean
				; backedge-taken counts.
				; SCEV-LABEL: Determining loop execution counts for: @test3
				; SCEV: Loop %inner_loop_begin{{.*}}: backedge-taken count is (-1 + (1 smax %m))<nsw>
				; SCEV: Loop %outer_loop_begin: backedge-taken count is (-1 + (1 smax %n))<nsw>
				;
				; And verify the code matches what we expect.
				; CHECK-LABEL: define void @test3(
				entry:
				br label %outer_loop_begin
				; Ensure the outer loop didn't get unswitched.
				; CHECK: entry:
				; CHECK-NEXT: br label %outer_loop_begin

				outer_loop_begin:
				%i = phi i32 [ %i.next, %outer_loop_latch ], [ 0, %entry ]
				; Block unswitching of the outer loop with a noduplicate call.
				call void @f() noduplicate
				br label %inner_loop_begin
				; Ensure the inner loop got unswitched into the outer loop.
				; CHECK: outer_loop_begin:
				; CHECK-NEXT: %{{.*}} = phi i32
				; CHECK-NEXT: call void @f()
				; CHECK-NEXT: br i1 %cond,

				inner_loop_begin:
				%j = phi i32 [ %j.next, %inner_loop_latch ], [ 0, %outer_loop_begin ]
				%j.tmp = add nsw i32 %j, 1
				br i1 %cond, label %inner_loop_latch, label %inner_loop_early_exit

				inner_loop_latch:
				%j.next = add nsw i32 %j, 1
				%j.cmp = icmp slt i32 %j.next, %m
				br i1 %j.cmp, label %inner_loop_begin, label %inner_loop_late_exit

				inner_loop_early_exit:
				%j.lcssa = phi i32 [ %j.tmp, %inner_loop_begin ]
				br label %outer_loop_latch

				inner_loop_late_exit:
				br label %outer_loop_latch

				outer_loop_latch:
				%inc.phi = phi i32 [ %j.lcssa, %inner_loop_early_exit ], [ 1, %inner_loop_late_exit ]
				%i.next = add nsw i32 %i, %inc.phi
				%i.cmp = icmp slt i32 %i.next, %n
				br i1 %i.cmp, label %outer_loop_begin, label %exit

				exit:
				ret void
				}

This is an archive of the discontinued LLVM Phabricator instance.

[PM/LoopUnswitch] Fix PR37651 by correctly invalidating SCEV when unswitching loops.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 153879

llvm/trunk/lib/Transforms/Scalar/SimpleLoopUnswitch.cpp

llvm/trunk/test/Transforms/SimpleLoopUnswitch/update-scev.ll

This is an archive of the discontinued LLVM Phabricator instance.

[PM/LoopUnswitch] Fix PR37651 by correctly invalidating SCEV when unswitching loops.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 153879

llvm/trunk/lib/Transforms/Scalar/SimpleLoopUnswitch.cpp

llvm/trunk/test/Transforms/SimpleLoopUnswitch/update-scev.ll

[PM/LoopUnswitch] Fix PR37651 by correctly invalidating SCEV when unswitching loops.
ClosedPublic