Diff 195189

lib/Transforms/Scalar/LoopPredication.cpp

Show First 20 Lines • Show All 172 Lines • ▼ Show 20 Lines
// For uge condition the widened condition is:		// For uge condition the widened condition is:
// guardStart u< guardLimit && latchLimit u> 1.		// guardStart u< guardLimit && latchLimit u> 1.
// For sge condition the widened condition is:		// For sge condition the widened condition is:
// guardStart u< guardLimit && latchLimit s> 1.		// guardStart u< guardLimit && latchLimit s> 1.
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "llvm/Transforms/Scalar/LoopPredication.h"		#include "llvm/Transforms/Scalar/LoopPredication.h"
#include "llvm/ADT/Statistic.h"		#include "llvm/ADT/Statistic.h"
		#include "llvm/Analysis/AliasAnalysis.h"
#include "llvm/Analysis/BranchProbabilityInfo.h"		#include "llvm/Analysis/BranchProbabilityInfo.h"
#include "llvm/Analysis/GuardUtils.h"		#include "llvm/Analysis/GuardUtils.h"
#include "llvm/Analysis/LoopInfo.h"		#include "llvm/Analysis/LoopInfo.h"
#include "llvm/Analysis/LoopPass.h"		#include "llvm/Analysis/LoopPass.h"
#include "llvm/Analysis/ScalarEvolution.h"		#include "llvm/Analysis/ScalarEvolution.h"
#include "llvm/Analysis/ScalarEvolutionExpander.h"		#include "llvm/Analysis/ScalarEvolutionExpander.h"
#include "llvm/Analysis/ScalarEvolutionExpressions.h"		#include "llvm/Analysis/ScalarEvolutionExpressions.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
▲ Show 20 Lines • Show All 52 Lines • ▼ Show 20 Lines	LoopICmp(ICmpInst::Predicate Pred, const SCEVAddRecExpr *IV,
: Pred(Pred), IV(IV), Limit(Limit) {}		: Pred(Pred), IV(IV), Limit(Limit) {}
LoopICmp() {}		LoopICmp() {}
void dump() {		void dump() {
dbgs() << "LoopICmp Pred = " << Pred << ", IV = " << *IV		dbgs() << "LoopICmp Pred = " << Pred << ", IV = " << *IV
<< ", Limit = " << *Limit << "\n";		<< ", Limit = " << *Limit << "\n";
}		}
};		};

		AliasAnalysis *AA;
ScalarEvolution *SE;		ScalarEvolution *SE;
BranchProbabilityInfo *BPI;		BranchProbabilityInfo *BPI;

Loop *L;		Loop *L;
const DataLayout *DL;		const DataLayout *DL;
BasicBlock *Preheader;		BasicBlock *Preheader;
LoopICmp LatchCheck;		LoopICmp LatchCheck;

bool isSupportedStep(const SCEV* Step);		bool isSupportedStep(const SCEV* Step);
Optional<LoopICmp> parseLoopICmp(ICmpInst *ICI) {		Optional<LoopICmp> parseLoopICmp(ICmpInst *ICI) {
return parseLoopICmp(ICI->getPredicate(), ICI->getOperand(0),		return parseLoopICmp(ICI->getPredicate(), ICI->getOperand(0),
ICI->getOperand(1));		ICI->getOperand(1));
}		}
Optional<LoopICmp> parseLoopICmp(ICmpInst::Predicate Pred, Value *LHS,		Optional<LoopICmp> parseLoopICmp(ICmpInst::Predicate Pred, Value *LHS,
Value *RHS);		Value *RHS);

Optional<LoopICmp> parseLoopLatchICmp();		Optional<LoopICmp> parseLoopLatchICmp();

bool CanExpand(const SCEV* S);		bool CanExpand(const SCEV* S, const Instruction *At);
Value *expandCheck(SCEVExpander &Expander, IRBuilder<> &Builder,		Value *expandCheck(SCEVExpander &Expander, IRBuilder<> &Builder,
ICmpInst::Predicate Pred, const SCEV *LHS,		ICmpInst::Predicate Pred, const SCEV *LHS,
const SCEV *RHS);		const SCEV *RHS);

Optional<Value *> widenICmpRangeCheck(ICmpInst *ICI, SCEVExpander &Expander,		Optional<Value *> widenICmpRangeCheck(ICmpInst *ICI, SCEVExpander &Expander,
IRBuilder<> &Builder);		IRBuilder<> &Builder);
Optional<Value *> widenICmpRangeCheckIncrementingLoop(LoopICmp LatchCheck,		Optional<Value *> widenICmpRangeCheckIncrementingLoop(LoopICmp LatchCheck,
LoopICmp RangeCheck,		LoopICmp RangeCheck,
Show All 26 Lines	class LoopPredication {
// This function returns true if we can safely represent the IV type in		// This function returns true if we can safely represent the IV type in
// the RangeCheckType without loss of information.		// the RangeCheckType without loss of information.
bool isSafeToTruncateWideIVType(Type *RangeCheckType);		bool isSafeToTruncateWideIVType(Type *RangeCheckType);
// Return the loopLatchCheck corresponding to the RangeCheckType if safe to do		// Return the loopLatchCheck corresponding to the RangeCheckType if safe to do
// so.		// so.
Optional<LoopICmp> generateLoopLatchCheck(Type *RangeCheckType);		Optional<LoopICmp> generateLoopLatchCheck(Type *RangeCheckType);

public:		public:
LoopPredication(ScalarEvolution *SE, BranchProbabilityInfo *BPI)		LoopPredication(AliasAnalysis *AA, ScalarEvolution *SE,
: SE(SE), BPI(BPI){};		BranchProbabilityInfo *BPI)
		: AA(AA), SE(SE), BPI(BPI){};
bool runOnLoop(Loop *L);		bool runOnLoop(Loop *L);
};		};

class LoopPredicationLegacyPass : public LoopPass {		class LoopPredicationLegacyPass : public LoopPass {
public:		public:
static char ID;		static char ID;
LoopPredicationLegacyPass() : LoopPass(ID) {		LoopPredicationLegacyPass() : LoopPass(ID) {
initializeLoopPredicationLegacyPassPass(*PassRegistry::getPassRegistry());		initializeLoopPredicationLegacyPassPass(*PassRegistry::getPassRegistry());
}		}

void getAnalysisUsage(AnalysisUsage &AU) const override {		void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.addRequired<BranchProbabilityInfoWrapperPass>();		AU.addRequired<BranchProbabilityInfoWrapperPass>();
getLoopAnalysisUsage(AU);		getLoopAnalysisUsage(AU);
}		}

bool runOnLoop(Loop *L, LPPassManager &LPM) override {		bool runOnLoop(Loop *L, LPPassManager &LPM) override {
if (skipLoop(L))		if (skipLoop(L))
return false;		return false;
auto *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();		auto *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE();
BranchProbabilityInfo &BPI =		BranchProbabilityInfo &BPI =
getAnalysis<BranchProbabilityInfoWrapperPass>().getBPI();		getAnalysis<BranchProbabilityInfoWrapperPass>().getBPI();
LoopPredication LP(SE, &BPI);		auto *AA = &getAnalysis<AAResultsWrapperPass>().getAAResults();
		LoopPredication LP(AA, SE, &BPI);
return LP.runOnLoop(L);		return LP.runOnLoop(L);
}		}
};		};

char LoopPredicationLegacyPass::ID = 0;		char LoopPredicationLegacyPass::ID = 0;
} // end namespace llvm		} // end namespace llvm

INITIALIZE_PASS_BEGIN(LoopPredicationLegacyPass, "loop-predication",		INITIALIZE_PASS_BEGIN(LoopPredicationLegacyPass, "loop-predication",
Show All 9 Lines

PreservedAnalyses LoopPredicationPass::run(Loop &L, LoopAnalysisManager &AM,		PreservedAnalyses LoopPredicationPass::run(Loop &L, LoopAnalysisManager &AM,
LoopStandardAnalysisResults &AR,		LoopStandardAnalysisResults &AR,
LPMUpdater &U) {		LPMUpdater &U) {
const auto &FAM =		const auto &FAM =
AM.getResult<FunctionAnalysisManagerLoopProxy>(L, AR).getManager();		AM.getResult<FunctionAnalysisManagerLoopProxy>(L, AR).getManager();
Function *F = L.getHeader()->getParent();		Function *F = L.getHeader()->getParent();
auto *BPI = FAM.getCachedResult<BranchProbabilityAnalysis>(*F);		auto *BPI = FAM.getCachedResult<BranchProbabilityAnalysis>(*F);
LoopPredication LP(&AR.SE, BPI);		LoopPredication LP(&AR.AA, &AR.SE, BPI);
if (!LP.runOnLoop(&L))		if (!LP.runOnLoop(&L))
return PreservedAnalyses::all();		return PreservedAnalyses::all();

return getLoopPassPreservedAnalyses();		return getLoopPassPreservedAnalyses();
}		}

Optional<LoopPredication::LoopICmp>		Optional<LoopPredication::LoopICmp>
LoopPredication::parseLoopICmp(ICmpInst::Predicate Pred, Value *LHS,		LoopPredication::parseLoopICmp(ICmpInst::Predicate Pred, Value *LHS,
Show All 21 Lines

Value *LoopPredication::expandCheck(SCEVExpander &Expander,		Value *LoopPredication::expandCheck(SCEVExpander &Expander,
IRBuilder<> &Builder,		IRBuilder<> &Builder,
ICmpInst::Predicate Pred, const SCEV *LHS,		ICmpInst::Predicate Pred, const SCEV *LHS,
const SCEV *RHS) {		const SCEV *RHS) {
Type *Ty = LHS->getType();		Type *Ty = LHS->getType();
assert(Ty == RHS->getType() && "expandCheck operands have different types?");		assert(Ty == RHS->getType() && "expandCheck operands have different types?");

		const bool OpsAreLoopInvariant =
		SE->isLoopInvariant(LHS, L) && SE->isLoopInvariant(RHS, L);
		if (OpsAreLoopInvariant) {
if (SE->isLoopEntryGuardedByCond(L, Pred, LHS, RHS))		if (SE->isLoopEntryGuardedByCond(L, Pred, LHS, RHS))
return Builder.getTrue();		return Builder.getTrue();
if (SE->isLoopEntryGuardedByCond(L, ICmpInst::getInversePredicate(Pred),		if (SE->isLoopEntryGuardedByCond(L, ICmpInst::getInversePredicate(Pred),
LHS, RHS))		LHS, RHS))
return Builder.getFalse();		return Builder.getFalse();
		}
		apilipenkoUnsubmitted Not Done Reply Inline Actions Nit. Extract `SE->isLoopInvariant(LHS, L) && SE->isLoopInvariant(RHS, L)` into a local variable? You check it below as well. apilipenko: Nit. Extract `SE->isLoopInvariant(LHS, L) && SE->isLoopInvariant(RHS, L)` into a local variable?

Instruction *InsertAt = &*Builder.GetInsertPoint();		Instruction * const InsertAt = OpsAreLoopInvariant ?
		Preheader->getTerminator() : &*Builder.GetInsertPoint();
Value *LHSV = Expander.expandCodeFor(LHS, Ty, InsertAt);		Value *LHSV = Expander.expandCodeFor(LHS, Ty, InsertAt);
		apilipenkoUnsubmitted Not Done Reply Inline Actions You can use `Preheader` cached in the field. apilipenko: You can use `Preheader` cached in the field.
Value *RHSV = Expander.expandCodeFor(RHS, Ty, InsertAt);		Value *RHSV = Expander.expandCodeFor(RHS, Ty, InsertAt);
		IRBuilder<>::InsertPointGuard G(Builder);
		Builder.SetInsertPoint(InsertAt);
return Builder.CreateICmp(Pred, LHSV, RHSV);		return Builder.CreateICmp(Pred, LHSV, RHSV);
}		}

Optional<LoopPredication::LoopICmp>		Optional<LoopPredication::LoopICmp>
LoopPredication::generateLoopLatchCheck(Type *RangeCheckType) {		LoopPredication::generateLoopLatchCheck(Type *RangeCheckType) {

auto *LatchType = LatchCheck.IV->getType();		auto *LatchType = LatchCheck.IV->getType();
if (RangeCheckType == LatchType)		if (RangeCheckType == LatchType)
Show All 19 Lines	LoopPredication::generateLoopLatchCheck(Type *RangeCheckType) {
LLVM_DEBUG(dbgs() << "LatchCheck.Limit: " << *NewLatchCheck.Limit << "\n");		LLVM_DEBUG(dbgs() << "LatchCheck.Limit: " << *NewLatchCheck.Limit << "\n");
return NewLatchCheck;		return NewLatchCheck;
}		}

bool LoopPredication::isSupportedStep(const SCEV* Step) {		bool LoopPredication::isSupportedStep(const SCEV* Step) {
return Step->isOne() || (Step->isAllOnesValue() && EnableCountDownLoop);		return Step->isOne() || (Step->isAllOnesValue() && EnableCountDownLoop);
}		}

bool LoopPredication::CanExpand(const SCEV* S) {		bool LoopPredication::CanExpand(const SCEV* S, const Instruction *At) {
		apilipenkoUnsubmitted Not Done Reply Inline Actions Am I right that this is not specific to the change you make and just a fix for an existing bug? If so, can be integrated separately with a test demonstrating the problem. apilipenko: Am I right that this is not specific to the change you make and just a fix for an existing bug?
		reamesAuthorUnsubmitted Done Reply Inline Actions You are correct, and I'd completely missed that when writing. Will do! reames: You are correct, and I'd completely missed that when writing. Will do!
		reamesAuthorUnsubmitted Done Reply Inline Actions Actually, no. On further reflection, this is a silent bug without the rest of this change. All of the operands to the expressions we call this on have previously been checked via isSafeToSpeculate. It's only with this change that we weaken that precondition and expose the latent issue. Given that, I'm not going to submit this separately. reames: Actually, no. On further reflection, this is a silent bug without the rest of this change.
return SE->isLoopInvariant(S, L) && isSafeToExpand(S, *SE);		if (SE->isLoopInvariant(S, L) && isSafeToExpand(S, *SE))
		return true;

		// Handling expressions which produce invariant results, but haven't yet
		// been removed from the loop serves two important purposes.
		// 1) Most importantly, it resolves a pass ordering cycle which would
		// otherwise need us to iterate licm, loop-predication, and either
		// loop-unswitch or loop-peeling to make progress on examples with lots of
		// predicable range checks in a row. (Since, in the general case, we can't
		// hoist the length checks until the dominating checks have been discharged
		// as we can't prove doing so is safe.)
		// 2) As a nice side effect, this exposes the value of peeling or unswitching
		// much more obviously in the IR. Otherwise, the cost modeling for other
		// transforms would end up needing to duplicate all of this logic to model a
		// check which becomes predictable based on a modeled peel or unswitch.
		//
		// The cost of doing so in the worst case is an extra load in the loop to
		// materialize the loop invariant test value instead of checking against the
		// original IV which is presumably in a register inside the loop. Such cases
		// are presumably rare, and hint at missing opportunities for other passes.
		if (const SCEVUnknown *U = dyn_cast<SCEVUnknown>(S))
		apilipenkoUnsubmitted Not Done Reply Inline Actions Debug printing. apilipenko: Debug printing.
		if (const auto *LI = dyn_cast<LoadInst>(U->getValue())) {
		if (!LI->isUnordered())
		return false;
		if (AA->pointsToConstantMemory(LI->getOperand(0)) ||
		LI->getMetadata(LLVMContext::MD_invariant_load) != nullptr)
		return isSafeToExpandAt(S, At, *SE);
		}
		return false;
}		}

Optional<Value *> LoopPredication::widenICmpRangeCheckIncrementingLoop(		Optional<Value *> LoopPredication::widenICmpRangeCheckIncrementingLoop(
LoopPredication::LoopICmp LatchCheck, LoopPredication::LoopICmp RangeCheck,		LoopPredication::LoopICmp LatchCheck, LoopPredication::LoopICmp RangeCheck,
SCEVExpander &Expander, IRBuilder<> &Builder) {		SCEVExpander &Expander, IRBuilder<> &Builder) {
auto *Ty = RangeCheck.IV->getType();		auto *Ty = RangeCheck.IV->getType();
// Generate the widened condition for the forward loop:		// Generate the widened condition for the forward loop:
// guardStart u< guardLimit &&		// guardStart u< guardLimit &&
// latchLimit <pred> guardLimit - 1 - guardStart + latchStart		// latchLimit <pred> guardLimit - 1 - guardStart + latchStart
// where <pred> depends on the latch condition predicate. See the file		// where <pred> depends on the latch condition predicate. See the file
// header comment for the reasoning.		// header comment for the reasoning.
// guardLimit - guardStart + latchStart - 1		// guardLimit - guardStart + latchStart - 1
const SCEV *GuardStart = RangeCheck.IV->getStart();		const SCEV *GuardStart = RangeCheck.IV->getStart();
const SCEV *GuardLimit = RangeCheck.Limit;		const SCEV *GuardLimit = RangeCheck.Limit;
const SCEV *LatchStart = LatchCheck.IV->getStart();		const SCEV *LatchStart = LatchCheck.IV->getStart();
const SCEV *LatchLimit = LatchCheck.Limit;		const SCEV *LatchLimit = LatchCheck.Limit;

// guardLimit - guardStart + latchStart - 1		// guardLimit - guardStart + latchStart - 1
const SCEV *RHS =		const SCEV *RHS =
		apilipenkoUnsubmitted Not Done Reply Inline Actions Can we assert isSafeToExpandAt for the values we don't check? apilipenko: Can we assert isSafeToExpandAt for the values we don't check?
		reamesAuthorUnsubmitted Done Reply Inline Actions No we can't. That's the entire point of not checking. The basic structure here is that isSafeToExpand guarantees expansion is safe, but a false return value can still be safe to expand. In this case, we use information about dominance of the original conditions in the IR to ensure safety of these two. reames: No we can't. That's the entire point of not checking. The basic structure here is that…
SE->getAddExpr(SE->getMinusSCEV(GuardLimit, GuardStart),		SE->getAddExpr(SE->getMinusSCEV(GuardLimit, GuardStart),
SE->getMinusSCEV(LatchStart, SE->getOne(Ty)));		SE->getMinusSCEV(LatchStart, SE->getOne(Ty)));
if (!CanExpand(GuardStart) || !CanExpand(GuardLimit) ||		Instruction *InsertAt = &*Builder.GetInsertPoint();
!CanExpand(LatchLimit) || !CanExpand(RHS)) {		Instruction *PHTerm = Preheader->getTerminator();
		if (!CanExpand(GuardStart, PHTerm) || !CanExpand(GuardLimit, InsertAt) ||
		!CanExpand(LatchLimit, PHTerm) || !CanExpand(RHS, InsertAt)) {
LLVM_DEBUG(dbgs() << "Can't expand limit check!\n");		LLVM_DEBUG(dbgs() << "Can't expand limit check!\n");
return None;		return None;
}		}
auto LimitCheckPred =		auto LimitCheckPred =
ICmpInst::getFlippedStrictnessPredicate(LatchCheck.Pred);		ICmpInst::getFlippedStrictnessPredicate(LatchCheck.Pred);

LLVM_DEBUG(dbgs() << "LHS: " << *LatchLimit << "\n");		LLVM_DEBUG(dbgs() << "LHS: " << *LatchLimit << "\n");
LLVM_DEBUG(dbgs() << "RHS: " << *RHS << "\n");		LLVM_DEBUG(dbgs() << "RHS: " << *RHS << "\n");
LLVM_DEBUG(dbgs() << "Pred: " << LimitCheckPred << "\n");		LLVM_DEBUG(dbgs() << "Pred: " << LimitCheckPred << "\n");

auto *LimitCheck =		auto *LimitCheck =
		apilipenkoUnsubmitted Not Done Reply Inline Actions These changes look correct to me, but there are actually a couple of NFC refactorings (replacing CanExpand(RHS) with CanExpand(LatchStart), inlining CanExpand, removing isSafeToExpandAt checks for GuardStart, GuardLimit) mixed with a functional change to use isLoopInvariantValue instead of SE->isLoopInvariant. You might want to split these when integrating to make bisecting easier. apilipenko: These changes look correct to me, but there are actually a couple of NFC refactorings…
		reamesAuthorUnsubmitted Done Reply Inline Actions I thought about it, but explaining the NFC part without context seemed challenging. So I left them together. reames: I thought about it, but explaining the NFC part without context seemed challenging. So I left…
expandCheck(Expander, Builder, LimitCheckPred, LatchLimit, RHS);		expandCheck(Expander, Builder, LimitCheckPred, LatchLimit, RHS);
auto *FirstIterationCheck = expandCheck(Expander, Builder, RangeCheck.Pred,		auto *FirstIterationCheck = expandCheck(Expander, Builder, RangeCheck.Pred,
GuardStart, GuardLimit);		GuardStart, GuardLimit);
		if (L->isLoopInvariant(LimitCheck) && L->isLoopInvariant(FirstIterationCheck))
		InsertAt = Preheader->getTerminator();
		IRBuilder<>::InsertPointGuard G(Builder);
		Builder.SetInsertPoint(InsertAt);
return Builder.CreateAnd(FirstIterationCheck, LimitCheck);		return Builder.CreateAnd(FirstIterationCheck, LimitCheck);
}		}

Optional<Value *> LoopPredication::widenICmpRangeCheckDecrementingLoop(		Optional<Value *> LoopPredication::widenICmpRangeCheckDecrementingLoop(
LoopPredication::LoopICmp LatchCheck, LoopPredication::LoopICmp RangeCheck,		LoopPredication::LoopICmp LatchCheck, LoopPredication::LoopICmp RangeCheck,
SCEVExpander &Expander, IRBuilder<> &Builder) {		SCEVExpander &Expander, IRBuilder<> &Builder) {
auto *Ty = RangeCheck.IV->getType();		auto *Ty = RangeCheck.IV->getType();
const SCEV *GuardStart = RangeCheck.IV->getStart();		const SCEV *GuardStart = RangeCheck.IV->getStart();
const SCEV *GuardLimit = RangeCheck.Limit;		const SCEV *GuardLimit = RangeCheck.Limit;
const SCEV *LatchLimit = LatchCheck.Limit;		const SCEV *LatchLimit = LatchCheck.Limit;
if (!CanExpand(GuardStart) || !CanExpand(GuardLimit) ||		Instruction *InsertAt = &*Builder.GetInsertPoint();
!CanExpand(LatchLimit)) {		if (!CanExpand(GuardStart, InsertAt) || !CanExpand(GuardLimit, InsertAt) ||
		!CanExpand(LatchLimit, InsertAt)) {
LLVM_DEBUG(dbgs() << "Can't expand limit check!\n");		LLVM_DEBUG(dbgs() << "Can't expand limit check!\n");
return None;		return None;
}		}
// The decrement of the latch check IV should be the same as the		// The decrement of the latch check IV should be the same as the
// rangeCheckIV.		// rangeCheckIV.
auto *PostDecLatchCheckIV = LatchCheck.IV->getPostIncExpr(*SE);		auto *PostDecLatchCheckIV = LatchCheck.IV->getPostIncExpr(*SE);
if (RangeCheck.IV != PostDecLatchCheckIV) {		if (RangeCheck.IV != PostDecLatchCheckIV) {
LLVM_DEBUG(dbgs() << "Not the same. PostDecLatchCheckIV: "		LLVM_DEBUG(dbgs() << "Not the same. PostDecLatchCheckIV: "
<< *PostDecLatchCheckIV		<< *PostDecLatchCheckIV
<< " and RangeCheckIV: " << *RangeCheck.IV << "\n");		<< " and RangeCheckIV: " << *RangeCheck.IV << "\n");
return None;		return None;
}		}

// Generate the widened condition for CountDownLoop:		// Generate the widened condition for CountDownLoop:
// guardStart u< guardLimit &&		// guardStart u< guardLimit &&
// latchLimit <pred> 1.		// latchLimit <pred> 1.
// See the header comment for reasoning of the checks.		// See the header comment for reasoning of the checks.
auto LimitCheckPred =		auto LimitCheckPred =
ICmpInst::getFlippedStrictnessPredicate(LatchCheck.Pred);		ICmpInst::getFlippedStrictnessPredicate(LatchCheck.Pred);
auto *FirstIterationCheck = expandCheck(Expander, Builder, ICmpInst::ICMP_ULT,		auto *FirstIterationCheck = expandCheck(Expander, Builder, ICmpInst::ICMP_ULT,
GuardStart, GuardLimit);		GuardStart, GuardLimit);
auto *LimitCheck = expandCheck(Expander, Builder, LimitCheckPred, LatchLimit,		auto *LimitCheck = expandCheck(Expander, Builder, LimitCheckPred, LatchLimit,
SE->getOne(Ty));		SE->getOne(Ty));
		if (L->isLoopInvariant(LimitCheck) && L->isLoopInvariant(FirstIterationCheck))
		InsertAt = Preheader->getTerminator();
		IRBuilder<>::InsertPointGuard G(Builder);
		Builder.SetInsertPoint(InsertAt);
return Builder.CreateAnd(FirstIterationCheck, LimitCheck);		return Builder.CreateAnd(FirstIterationCheck, LimitCheck);
}		}

/// If ICI can be widened to a loop invariant condition emits the loop		/// If ICI can be widened to a loop invariant condition emits the loop
/// invariant condition in the loop preheader and return it, otherwise		/// invariant condition in the loop preheader and return it, otherwise
/// returns None.		/// returns None.
Optional<Value *> LoopPredication::widenICmpRangeCheck(ICmpInst *ICI,		Optional<Value *> LoopPredication::widenICmpRangeCheck(ICmpInst *ICI,
SCEVExpander &Expander,		SCEVExpander &Expander,
▲ Show 20 Lines • Show All 58 Lines • ▼ Show 20 Lines	return widenICmpRangeCheckDecrementingLoop(CurrLatchCheck, *RangeCheck,
Expander, Builder);		Expander, Builder);
}		}
}		}

unsigned LoopPredication::collectChecks(SmallVectorImpl<Value *> &Checks,		unsigned LoopPredication::collectChecks(SmallVectorImpl<Value *> &Checks,
Value *Condition,		Value *Condition,
SCEVExpander &Expander,		SCEVExpander &Expander,
IRBuilder<> &Builder) {		IRBuilder<> &Builder) {
		IRBuilder<>::InsertPointGuard G(Builder);
unsigned NumWidened = 0;		unsigned NumWidened = 0;
// The guard condition is expected to be in form of:		// The guard condition is expected to be in form of:
// cond1 && cond2 && cond3 ...		// cond1 && cond2 && cond3 ...
// Iterate over subconditions looking for icmp conditions which can be		// Iterate over subconditions looking for icmp conditions which can be
// widened across loop iterations. Widening these conditions remember the		// widened across loop iterations. Widening these conditions remember the
// resulting list of subconditions in Checks vector.		// resulting list of subconditions in Checks vector.
SmallVector<Value *, 4> Worklist(1, Condition);		SmallVector<Value *, 4> Worklist(1, Condition);
SmallPtrSet<Value *, 4> Visited;		SmallPtrSet<Value *, 4> Visited;
Show All 14 Lines	do {
if (match(Condition,		if (match(Condition,
m_Intrinsic<Intrinsic::experimental_widenable_condition>())) {		m_Intrinsic<Intrinsic::experimental_widenable_condition>())) {
// Pick any, we don't care which		// Pick any, we don't care which
WideableCond = Condition;		WideableCond = Condition;
continue;		continue;
}		}

if (ICmpInst *ICI = dyn_cast<ICmpInst>(Condition)) {		if (ICmpInst *ICI = dyn_cast<ICmpInst>(Condition)) {
		IRBuilder<>::InsertPointGuard G(Builder);
		Builder.SetInsertPoint(ICI);
if (auto NewRangeCheck = widenICmpRangeCheck(ICI, Expander,		if (auto NewRangeCheck = widenICmpRangeCheck(ICI, Expander,
Builder)) {		Builder)) {
Checks.push_back(NewRangeCheck.getValue());		Checks.push_back(NewRangeCheck.getValue());
NumWidened++;		NumWidened++;
continue;		continue;
}		}
}		}

▲ Show 20 Lines • Show All 277 Lines • ▼ Show 20 Lines	bool LoopPredication::runOnLoop(Loop *Loop) {
SCEVExpander Expander(SE, DL, "loop-predication");		SCEVExpander Expander(SE, DL, "loop-predication");

bool Changed = false;		bool Changed = false;
for (auto *Guard : Guards)		for (auto *Guard : Guards)
Changed |= widenGuardConditions(Guard, Expander);		Changed |= widenGuardConditions(Guard, Expander);
for (auto *Guard : GuardsAsWidenableBranches)		for (auto *Guard : GuardsAsWidenableBranches)
Changed |= widenWidenableBranchGuardConditions(Guard, Expander);		Changed |= widenWidenableBranchGuardConditions(Guard, Expander);

return Changed;		return Changed;
		apilipenkoUnsubmitted Not Done Reply Inline Actions Debug printing. apilipenko: Debug printing.
		reamesAuthorUnsubmitted Done Reply Inline Actions Oops, good catch, thanks. reames: Oops, good catch, thanks.
}		}

test/Transforms/LoopPredication/invariant_load.ll

	Show First 20 Lines • Show All 72 Lines • ▼ Show 20 Lines
	; CHECK: loop.preheader:			; CHECK: loop.preheader:
	; CHECK-NEXT: br label [[LOOP:%.*]]			; CHECK-NEXT: br label [[LOOP:%.*]]
	; CHECK: loop:			; CHECK: loop:
	; CHECK-NEXT: [[LOOP_ACC:%.*]] = phi i32 [ [[LOOP_ACC_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]			; CHECK-NEXT: [[LOOP_ACC:%.*]] = phi i32 [ [[LOOP_ACC_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]
	; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]			; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]
	; CHECK-NEXT: [[UNKNOWN:%.*]] = load volatile i1, i1* @UNKNOWN			; CHECK-NEXT: [[UNKNOWN:%.*]] = load volatile i1, i1* @UNKNOWN
	; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[UNKNOWN]]) [ "deopt"() ]			; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[UNKNOWN]]) [ "deopt"() ]
	; CHECK-NEXT: [[LEN:%.*]] = load i32, i32* [[LENGTH:%.*]], align 4, !invariant.load !0			; CHECK-NEXT: [[LEN:%.*]] = load i32, i32* [[LENGTH:%.*]], align 4, !invariant.load !0
	; CHECK-NEXT: [[WITHIN_BOUNDS:%.*]] = icmp ult i32 [[I]], [[LEN]]			; CHECK-NEXT: [[TMP0:%.*]] = icmp ule i32 [[N]], [[LEN]]
	; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[WITHIN_BOUNDS]], i32 9) [ "deopt"() ]			; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 0, [[LEN]]
				; CHECK-NEXT: [[TMP2:%.*]] = and i1 [[TMP1]], [[TMP0]]
				; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[TMP2]], i32 9) [ "deopt"() ]
	; CHECK-NEXT: [[I_I64:%.*]] = zext i32 [[I]] to i64			; CHECK-NEXT: [[I_I64:%.*]] = zext i32 [[I]] to i64
	; CHECK-NEXT: [[ARRAY_I_PTR:%.*]] = getelementptr inbounds i32, i32* [[ARRAY:%.*]], i64 [[I_I64]]			; CHECK-NEXT: [[ARRAY_I_PTR:%.*]] = getelementptr inbounds i32, i32* [[ARRAY:%.*]], i64 [[I_I64]]
	; CHECK-NEXT: [[ARRAY_I:%.*]] = load i32, i32* [[ARRAY_I_PTR]], align 4			; CHECK-NEXT: [[ARRAY_I:%.*]] = load i32, i32* [[ARRAY_I_PTR]], align 4
	; CHECK-NEXT: [[LOOP_ACC_NEXT]] = add i32 [[LOOP_ACC]], [[ARRAY_I]]			; CHECK-NEXT: [[LOOP_ACC_NEXT]] = add i32 [[LOOP_ACC]], [[ARRAY_I]]
	; CHECK-NEXT: [[I_NEXT]] = add nuw i32 [[I]], 1			; CHECK-NEXT: [[I_NEXT]] = add nuw i32 [[I]], 1
	; CHECK-NEXT: [[CONTINUE:%.*]] = icmp ult i32 [[I_NEXT]], [[N]]			; CHECK-NEXT: [[CONTINUE:%.*]] = icmp ult i32 [[I_NEXT]], [[N]]
	; CHECK-NEXT: br i1 [[CONTINUE]], label [[LOOP]], label [[EXIT_LOOPEXIT:%.*]]			; CHECK-NEXT: br i1 [[CONTINUE]], label [[LOOP]], label [[EXIT_LOOPEXIT:%.*]]
	; CHECK: exit.loopexit:			; CHECK: exit.loopexit:
	▲ Show 20 Lines • Show All 43 Lines • ▼ Show 20 Lines
	; CHECK: loop.preheader:			; CHECK: loop.preheader:
	; CHECK-NEXT: br label [[LOOP:%.*]]			; CHECK-NEXT: br label [[LOOP:%.*]]
	; CHECK: loop:			; CHECK: loop:
	; CHECK-NEXT: [[LOOP_ACC:%.*]] = phi i32 [ [[LOOP_ACC_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]			; CHECK-NEXT: [[LOOP_ACC:%.*]] = phi i32 [ [[LOOP_ACC_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]
	; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]			; CHECK-NEXT: [[I:%.*]] = phi i32 [ [[I_NEXT:%.*]], [[LOOP]] ], [ 0, [[LOOP_PREHEADER]] ]
	; CHECK-NEXT: [[UNKNOWN:%.*]] = load volatile i1, i1* @UNKNOWN			; CHECK-NEXT: [[UNKNOWN:%.*]] = load volatile i1, i1* @UNKNOWN
	; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[UNKNOWN]]) [ "deopt"() ]			; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[UNKNOWN]]) [ "deopt"() ]
	; CHECK-NEXT: [[LEN:%.*]] = load i32, i32* @Length, align 4			; CHECK-NEXT: [[LEN:%.*]] = load i32, i32* @Length, align 4
	; CHECK-NEXT: [[WITHIN_BOUNDS:%.*]] = icmp ult i32 [[I]], [[LEN]]			; CHECK-NEXT: [[TMP0:%.*]] = icmp ule i32 [[N]], [[LEN]]
	; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[WITHIN_BOUNDS]], i32 9) [ "deopt"() ]			; CHECK-NEXT: [[TMP1:%.*]] = icmp ult i32 0, [[LEN]]
				; CHECK-NEXT: [[TMP2:%.*]] = and i1 [[TMP1]], [[TMP0]]
				; CHECK-NEXT: call void (i1, ...) @llvm.experimental.guard(i1 [[TMP2]], i32 9) [ "deopt"() ]
	; CHECK-NEXT: [[I_I64:%.*]] = zext i32 [[I]] to i64			; CHECK-NEXT: [[I_I64:%.*]] = zext i32 [[I]] to i64
	; CHECK-NEXT: [[ARRAY_I_PTR:%.*]] = getelementptr inbounds i32, i32* [[ARRAY:%.*]], i64 [[I_I64]]			; CHECK-NEXT: [[ARRAY_I_PTR:%.*]] = getelementptr inbounds i32, i32* [[ARRAY:%.*]], i64 [[I_I64]]
	; CHECK-NEXT: [[ARRAY_I:%.*]] = load i32, i32* [[ARRAY_I_PTR]], align 4			; CHECK-NEXT: [[ARRAY_I:%.*]] = load i32, i32* [[ARRAY_I_PTR]], align 4
	; CHECK-NEXT: [[LOOP_ACC_NEXT]] = add i32 [[LOOP_ACC]], [[ARRAY_I]]			; CHECK-NEXT: [[LOOP_ACC_NEXT]] = add i32 [[LOOP_ACC]], [[ARRAY_I]]
	; CHECK-NEXT: [[I_NEXT]] = add nuw i32 [[I]], 1			; CHECK-NEXT: [[I_NEXT]] = add nuw i32 [[I]], 1
	; CHECK-NEXT: [[CONTINUE:%.*]] = icmp ult i32 [[I_NEXT]], [[N]]			; CHECK-NEXT: [[CONTINUE:%.*]] = icmp ult i32 [[I_NEXT]], [[N]]
	; CHECK-NEXT: br i1 [[CONTINUE]], label [[LOOP]], label [[EXIT_LOOPEXIT:%.*]]			; CHECK-NEXT: br i1 [[CONTINUE]], label [[LOOP]], label [[EXIT_LOOPEXIT:%.*]]
	; CHECK: exit.loopexit:			; CHECK: exit.loopexit:
	▲ Show 20 Lines • Show All 95 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[LoopPredication] Allow predication of loop invariant computations
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 195189

lib/Transforms/Scalar/LoopPredication.cpp

test/Transforms/LoopPredication/invariant_load.ll

This is an archive of the discontinued LLVM Phabricator instance.

[LoopPredication] Allow predication of loop invariant computationsClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 195189

lib/Transforms/Scalar/LoopPredication.cpp

test/Transforms/LoopPredication/invariant_load.ll

[LoopPredication] Allow predication of loop invariant computations
ClosedPublic