Diff 138927

lib/Transforms/Scalar/CallSiteSplitting.cpp

Show First 20 Lines • Show All 139 Lines • ▼ Show 20 Lines	if (Pred == ICmpInst::ICMP_EQ \|\| Pred == ICmpInst::ICMP_NE)
if (isCondRelevantToAnyCallArgument(Cmp, CS))		if (isCondRelevantToAnyCallArgument(Cmp, CS))
Conditions.push_back({Cmp, From->getTerminator()->getSuccessor(0) == To		Conditions.push_back({Cmp, From->getTerminator()->getSuccessor(0) == To
? Pred		? Pred
: Cmp->getInversePredicate()});		: Cmp->getInversePredicate()});
}		}

/// Record ICmp conditions relevant to any argument in CS following Pred's		/// Record ICmp conditions relevant to any argument in CS following Pred's
/// single successors. If there are conflicting conditions along a path, like		/// single successors. If there are conflicting conditions along a path, like
/// x == 1 and x == 0, the first condition will be used.		/// x == 1 and x == 0, the first condition will be used. We stop once we reach
		/// an edge to StopAt.
static void recordConditions(CallSite CS, BasicBlock *Pred,		static void recordConditions(CallSite CS, BasicBlock *Pred,
ConditionsTy &Conditions) {		ConditionsTy &Conditions, BasicBlock *StopAt) {
recordCondition(CS, Pred, CS.getInstruction()->getParent(), Conditions);		recordCondition(CS, Pred, CS.getInstruction()->getParent(), Conditions);
BasicBlock *From = Pred;		BasicBlock *From = Pred;
BasicBlock *To = Pred;		BasicBlock *To = Pred;
SmallPtrSet<BasicBlock *, 4> Visited;		SmallPtrSet<BasicBlock *, 4> Visited;
while (!Visited.count(From->getSinglePredecessor()) &&		while (!Visited.count(From->getSinglePredecessor()) &&
(From = From->getSinglePredecessor())) {		(From = From->getSinglePredecessor()) && To != StopAt) {
		junbumlUnsubmitted Not Done Reply Inline Actions It seems better to place "To != StopAt" first : while (To != StopAt && !Visited.count(From->getSinglePredecessor()) && (From = From->getSinglePredecessor())) junbuml: It seems better to place "To != StopAt" first : ``` while (To != StopAt && !Visited.count…
recordCondition(CS, From, To, Conditions);		recordCondition(CS, From, To, Conditions);
Visited.insert(From);		Visited.insert(From);
To = From;		To = From;
}		}
}		}

static void addConditions(CallSite CS, const ConditionsTy &Conditions) {		static void addConditions(CallSite CS, const ConditionsTy &Conditions) {
for (auto &Cond : Conditions) {		for (auto &Cond : Conditions) {
▲ Show 20 Lines • Show All 123 Lines • ▼ Show 20 Lines
/// %p = phi i1 [%ca1, %Tail-split1],[%ca2, %Tail-split2]		/// %p = phi i1 [%ca1, %Tail-split1],[%ca2, %Tail-split2]
///		///
/// Note that in case any arguments at the call-site are constrained by its		/// Note that in case any arguments at the call-site are constrained by its
/// predecessors, new call-sites with more constrained arguments will be		/// predecessors, new call-sites with more constrained arguments will be
/// created in createCallSitesOnPredicatedArgument().		/// created in createCallSitesOnPredicatedArgument().
static void splitCallSite(		static void splitCallSite(
CallSite CS,		CallSite CS,
const SmallVectorImpl<std::pair<BasicBlock *, ConditionsTy>> &Preds,		const SmallVectorImpl<std::pair<BasicBlock *, ConditionsTy>> &Preds,
DominatorTree *DT) {		DominatorTree &DT) {
Instruction *Instr = CS.getInstruction();		Instruction *Instr = CS.getInstruction();
BasicBlock *TailBB = Instr->getParent();		BasicBlock *TailBB = Instr->getParent();
bool IsMustTailCall = CS.isMustTailCall();		bool IsMustTailCall = CS.isMustTailCall();

PHINode *CallPN = nullptr;		PHINode *CallPN = nullptr;

// `musttail` calls must be followed by optional `bitcast`, and `ret`. The		// `musttail` calls must be followed by optional `bitcast`, and `ret`. The
// split blocks will be terminated right after that so there're no users for		// split blocks will be terminated right after that so there're no users for
// this phi in a `TailBB`.		// this phi in a `TailBB`.
if (!IsMustTailCall && !Instr->use_empty())		if (!IsMustTailCall && !Instr->use_empty())
CallPN = PHINode::Create(Instr->getType(), Preds.size(), "phi.call");		CallPN = PHINode::Create(Instr->getType(), Preds.size(), "phi.call");

DEBUG(dbgs() << "split call-site : " << *Instr << " into \n");		DEBUG(dbgs() << "split call-site : " << *Instr << " into \n");

assert(Preds.size() == 2 && "The ValueToValueMaps array has size 2.");		assert(Preds.size() == 2 && "The ValueToValueMaps array has size 2.");
// ValueToValueMapTy is neither copy nor moveable, so we use a simple array		// ValueToValueMapTy is neither copy nor moveable, so we use a simple array
// here.		// here.
ValueToValueMapTy ValueToValueMaps[2];		ValueToValueMapTy ValueToValueMaps[2];
for (unsigned i = 0; i < Preds.size(); i++) {		for (unsigned i = 0; i < Preds.size(); i++) {
BasicBlock *PredBB = Preds[i].first;		BasicBlock *PredBB = Preds[i].first;
BasicBlock *SplitBlock = DuplicateInstructionsInSplitBetween(		BasicBlock *SplitBlock = DuplicateInstructionsInSplitBetween(
TailBB, PredBB, &*std::next(Instr->getIterator()), ValueToValueMaps[i], DT);		TailBB, PredBB, &*std::next(Instr->getIterator()), ValueToValueMaps[i],
		&DT);
assert(SplitBlock && "Unexpected new basic block split.");		assert(SplitBlock && "Unexpected new basic block split.");

Instruction *NewCI =		Instruction *NewCI =
&*std::prev(SplitBlock->getTerminator()->getIterator());		&*std::prev(SplitBlock->getTerminator()->getIterator());
CallSite NewCS(NewCI);		CallSite NewCS(NewCI);
addConditions(NewCS, Preds[i].second);		addConditions(NewCS, Preds[i].second);

// Handle PHIs used as arguments in the call-site.		// Handle PHIs used as arguments in the call-site.
▲ Show 20 Lines • Show All 93 Lines • ▼ Show 20 Lines	if (PHINode *PN = dyn_cast<PHINode>(&BI)) {
return true;		return true;
}		}
}		}
break;		break;
}		}
return false;		return false;
}		}

static bool tryToSplitOnPHIPredicatedArgument(CallSite CS, DominatorTree *DT) {		static bool tryToSplitOnPHIPredicatedArgument(CallSite CS, DominatorTree &DT) {
if (!isPredicatedOnPHI(CS))		if (!isPredicatedOnPHI(CS))
return false;		return false;

auto Preds = getTwoPredecessors(CS.getInstruction()->getParent());		auto Preds = getTwoPredecessors(CS.getInstruction()->getParent());
SmallVector<std::pair<BasicBlock *, ConditionsTy>, 2> PredsCS = {		SmallVector<std::pair<BasicBlock *, ConditionsTy>, 2> PredsCS = {
{Preds[0], {}}, {Preds[1], {}}};		{Preds[0], {}}, {Preds[1], {}}};
splitCallSite(CS, PredsCS, DT);		splitCallSite(CS, PredsCS, DT);
return true;		return true;
}		}

static bool tryToSplitOnPredicatedArgument(CallSite CS, DominatorTree *DT) {		static bool tryToSplitOnPredicatedArgument(CallSite CS, DominatorTree &DT) {
auto Preds = getTwoPredecessors(CS.getInstruction()->getParent());		auto Preds = getTwoPredecessors(CS.getInstruction()->getParent());
if (Preds[0] == Preds[1])		if (Preds[0] == Preds[1])
return false;		return false;

		// We can stop recording conditions once we reach the immediate dominator
		// for the block containing the call site. Conditions in predecessors of
		// that node will be the same for all paths to the call site and splitting
		// is not beneficial.
		auto *CSDTNode = DT.getNode(CS.getInstruction()->getParent());
		BasicBlock *StopAt = CSDTNode ? CSDTNode->getIDom()->getBlock() : nullptr;

SmallVector<std::pair<BasicBlock *, ConditionsTy>, 2> PredsCS;		SmallVector<std::pair<BasicBlock *, ConditionsTy>, 2> PredsCS;
for (auto *Pred : make_range(Preds.rbegin(), Preds.rend())) {		for (auto *Pred : make_range(Preds.rbegin(), Preds.rend())) {
ConditionsTy Conditions;		ConditionsTy Conditions;
recordConditions(CS, Pred, Conditions);		recordConditions(CS, Pred, Conditions, StopAt);
PredsCS.push_back({Pred, Conditions});		PredsCS.push_back({Pred, Conditions});
}		}

if (std::all_of(PredsCS.begin(), PredsCS.end(),		if (std::all_of(PredsCS.begin(), PredsCS.end(),
[](const std::pair<BasicBlock *, ConditionsTy> &P) {		[](const std::pair<BasicBlock *, ConditionsTy> &P) {
return P.second.empty();		return P.second.empty();
}))		}))
return false;		return false;

splitCallSite(CS, PredsCS, DT);		splitCallSite(CS, PredsCS, DT);
return true;		return true;
}		}

static bool tryToSplitCallSite(CallSite CS, TargetTransformInfo &TTI, DominatorTree *DT) {		static bool tryToSplitCallSite(CallSite CS, TargetTransformInfo &TTI,
if (!CS.arg_size() \|\| !canSplitCallSite(CS))		DominatorTree &DT) {
		if (!CS.arg_size() \|\| !canSplitCallSite(CS, TTI))
return false;		return false;
return tryToSplitOnPredicatedArgument(CS, DT) \|\|		return tryToSplitOnPredicatedArgument(CS, DT) \|\|
tryToSplitOnPHIPredicatedArgument(CS, DT);		tryToSplitOnPHIPredicatedArgument(CS, DT);
}		}

		junbumlUnsubmitted Not Done Reply Inline Actions I think we should move this to line 461. Otherwise, we won't be able to handle the case where a known value is not detected in the immediate predecessors, but there is a known value after the IDom. Looks like test_cond_no_effect() shows this case. junbuml: I think we should move this to line 461. Otherwise, we won't be able to handle the case where a…
		junbumlUnsubmitted Not Done Reply Inline Actions In this case (test_cond_no_effect), we should just pass the known value without splitting. Looks like I tried something similar before in https://reviews.llvm.org/D41782. junbuml: In this case (test_cond_no_effect), we should just pass the known value without splitting.
		fhahnAuthorUnsubmitted Not Done Reply Inline Actions As this patch is at the moment, it is not an NFC, as it prevents splitting in case there are no suitable conditions along any path between the IDom and the call site. "In this case (test_cond_no_effect), we should just pass the known value without splitting. Looks like I tried something similar before in https://reviews.llvm.org/D41782." I just thought the same thing :) With my change, it should be quite straightforward to handle that case. But I would prefer to do that in a different patch. fhahn: As this patch is at the moment, it is not an NFC, as it prevents splitting in case there are no…
		fhahnAuthorUnsubmitted Not Done Reply Inline Actions "In this case (test_cond_no_effect), we should just pass the known value without splitting. Looks like I tried something similar before in https://reviews.llvm.org/D41782." I thought a bit more about how to best handle propagating common facts that do not require splitting. I do not think we can do it properly here without making things too complicated. I've shared a WIP patch that is a first step towards enabling IPSCCP to propagate facts from compare instructions: D45330 fhahn: > In this case (test_cond_no_effect), we should just pass the known value without splitting.
static bool doCallSiteSplitting(Function &F, TargetLibraryInfo &TLI,		static bool doCallSiteSplitting(Function &F, TargetLibraryInfo &TLI,
TargetTransformInfo &TTI,		TargetTransformInfo &TTI, DominatorTree &DT) {
DominatorTree *DT) {
bool Changed = false;		bool Changed = false;
for (Function::iterator BI = F.begin(), BE = F.end(); BI != BE;) {		for (Function::iterator BI = F.begin(), BE = F.end(); BI != BE;) {
BasicBlock &BB = *BI++;		BasicBlock &BB = *BI++;
auto II = BB.getFirstNonPHIOrDbg()->getIterator();		auto II = BB.getFirstNonPHIOrDbg()->getIterator();
auto IE = BB.getTerminator()->getIterator();		auto IE = BB.getTerminator()->getIterator();
// Iterate until we reach the terminator instruction. tryToSplitCallSite		// Iterate until we reach the terminator instruction. tryToSplitCallSite
// can replace BB's terminator in case BB is a successor of itself. In that		// can replace BB's terminator in case BB is a successor of itself. In that
// case, IE will be invalidated and we also have to check the current		// case, IE will be invalidated and we also have to check the current
Show All 28 Lines	struct CallSiteSplittingLegacyPass : public FunctionPass {
static char ID;		static char ID;
CallSiteSplittingLegacyPass() : FunctionPass(ID) {		CallSiteSplittingLegacyPass() : FunctionPass(ID) {
initializeCallSiteSplittingLegacyPassPass(*PassRegistry::getPassRegistry());		initializeCallSiteSplittingLegacyPassPass(*PassRegistry::getPassRegistry());
}		}

void getAnalysisUsage(AnalysisUsage &AU) const override {		void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.addRequired<TargetLibraryInfoWrapperPass>();		AU.addRequired<TargetLibraryInfoWrapperPass>();
AU.addRequired<TargetTransformInfoWrapperPass>();		AU.addRequired<TargetTransformInfoWrapperPass>();
		AU.addRequired<DominatorTreeWrapperPass>();
AU.addPreserved<DominatorTreeWrapperPass>();		AU.addPreserved<DominatorTreeWrapperPass>();
FunctionPass::getAnalysisUsage(AU);		FunctionPass::getAnalysisUsage(AU);
}		}

bool runOnFunction(Function &F) override {		bool runOnFunction(Function &F) override {
if (skipFunction(F))		if (skipFunction(F))
return false;		return false;

auto &TLI = getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();		auto &TLI = getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();
auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);		auto &TTI = getAnalysis<TargetTransformInfoWrapperPass>().getTTI(F);
auto *DTWP = getAnalysisIfAvailable<DominatorTreeWrapperPass>();		auto &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree();
return doCallSiteSplitting(F, TLI, TTI, DTWP ? &DTWP->getDomTree() : nullptr);		return doCallSiteSplitting(F, TLI, TTI, DT);
}		}
};		};
} // namespace		} // namespace

char CallSiteSplittingLegacyPass::ID = 0;		char CallSiteSplittingLegacyPass::ID = 0;
INITIALIZE_PASS_BEGIN(CallSiteSplittingLegacyPass, "callsite-splitting",		INITIALIZE_PASS_BEGIN(CallSiteSplittingLegacyPass, "callsite-splitting",
"Call-site splitting", false, false)		"Call-site splitting", false, false)
INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)		INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)		INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass)
		INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
INITIALIZE_PASS_END(CallSiteSplittingLegacyPass, "callsite-splitting",		INITIALIZE_PASS_END(CallSiteSplittingLegacyPass, "callsite-splitting",
"Call-site splitting", false, false)		"Call-site splitting", false, false)
FunctionPass *llvm::createCallSiteSplittingPass() {		FunctionPass *llvm::createCallSiteSplittingPass() {
return new CallSiteSplittingLegacyPass();		return new CallSiteSplittingLegacyPass();
}		}

PreservedAnalyses CallSiteSplittingPass::run(Function &F,		PreservedAnalyses CallSiteSplittingPass::run(Function &F,
FunctionAnalysisManager &AM) {		FunctionAnalysisManager &AM) {
auto &TLI = AM.getResult<TargetLibraryAnalysis>(F);		auto &TLI = AM.getResult<TargetLibraryAnalysis>(F);
auto &TTI = AM.getResult<TargetIRAnalysis>(F);		auto &TTI = AM.getResult<TargetIRAnalysis>(F);
auto *DT = AM.getCachedResult<DominatorTreeAnalysis>(F);		auto &DT = AM.getResult<DominatorTreeAnalysis>(F);

if (!doCallSiteSplitting(F, TLI, TTI, DT))		if (!doCallSiteSplitting(F, TLI, TTI, DT))
return PreservedAnalyses::all();		return PreservedAnalyses::all();
PreservedAnalyses PA;		PreservedAnalyses PA;
PA.preserve<DominatorTreeAnalysis>();		PA.preserve<DominatorTreeAnalysis>();
return PA;		return PA;
}		}

test/Transforms/CallSiteSplitting/callsite-split-or-phi.ll

Show All 33 Lines
End:		End:
ret i32 %v		ret i32 %v
}		}

;CHECK-LABEL: @test_eq_eq_eq		;CHECK-LABEL: @test_eq_eq_eq
;CHECK-LABEL: Header2.split:		;CHECK-LABEL: Header2.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 null, i32 %v, i32 10)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 null, i32 %v, i32 10)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 null, i32 1, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 1, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
define i32 @test_eq_eq_eq(i32* %a, i32 %v, i32 %p) {		define i32 @test_eq_eq_eq(i32* %a, i32 %v, i32 %p) {
junbumlUnsubmitted Not Done Reply Inline Actions We may want to keep this test as it is. With this patch, the split call sites will take %a instead of null. The null value might be propagated to the call site later in the pipeline, but there is no reason not to pass the known null value early in the pipeline. If the callee has an early-exit condition with a null check, the inliner may have a better opportunity to get this callee inlined by passing null. junbuml: We may want to keep this test as it is. With this patch, the split call sites will take %a…
fhahnAuthorUnsubmitted Not Done Reply Inline Actions Ah yes, if we split anyways, we could also propagate other known constraints. fhahn: Ah yes, if we split anyways, we could also propagate other known constraints.
junbumlUnsubmitted Not Done Reply Inline Actions This may show that the inliner fails to inline the callee with this change. define i32 @test_eq_eq_eq(i32* %a, i32 %v, i32 %p) { Header: %tobool1 = icmp eq i32* %a, null br i1 %tobool1, label %Header2, label %End Header2: %tobool2 = icmp eq i32 %p, 10 call void @dummy() br i1 %tobool2, label %Tail, label %TBB TBB: %cmp = icmp eq i32 %v, 1 call void @dummy() br i1 %cmp, label %Tail, label %End Tail: %r = call i32 @callee(i32* %a, i32 %v, i32 %p) ret i32 %r End: ret i32 %v } define i32 @callee(i32* %a, i32 %v, i32 %p) { entry: %c = icmp eq i32* %a, null br i1 %c, label %BB1, label %BB2 BB1: ret i32 0 BB2: call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) call void @dummy2(i32 %v, i32 %p) br label %End End: ret i32 %p } declare void @dummy() declare void @dummy2(i32, i32) junbuml: This may show that the inliner fails to inline the callee with this change. ``` define i32…
Header:		Header:
%tobool1 = icmp eq i32* %a, null		%tobool1 = icmp eq i32* %a, null
br i1 %tobool1, label %Header2, label %End		br i1 %tobool1, label %Header2, label %TBB

Header2:		Header2:
%tobool2 = icmp eq i32 %p, 10		%tobool2 = icmp eq i32 %p, 10
br i1 %tobool2, label %Tail, label %TBB		br i1 %tobool2, label %Tail, label %TBB

TBB:		TBB:
%cmp = icmp eq i32 %v, 1		%cmp = icmp eq i32 %v, 1
br i1 %cmp, label %Tail, label %End		br i1 %cmp, label %Tail, label %End
▲ Show 20 Lines • Show All 60 Lines • ▼ Show 20 Lines
End:		End:
ret i32 %v		ret i32 %v
}		}

;CHECK-LABEL: @test_ne_eq_ne		;CHECK-LABEL: @test_ne_eq_ne
;CHECK-LABEL: Header2.split:		;CHECK-LABEL: Header2.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 10)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 10)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 %v, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
define i32 @test_ne_eq_ne(i32* %a, i32 %v, i32 %p) {		define i32 @test_ne_eq_ne(i32* %a, i32 %v, i32 %p) {
Header:		Header:
%tobool1 = icmp ne i32* %a, null		%tobool1 = icmp ne i32* %a, null
br i1 %tobool1, label %Header2, label %End		br i1 %tobool1, label %Header2, label %TBB
junbumlUnsubmitted Not Done Reply Inline Actions We should keep this test to check that nonnull is passed to both call-sites. junbuml: We should keep this test to check that nonnull is passed to both call-sites.
		junbumlUnsubmitted Not Done Reply Inline Actions We can add this test, but I don't think there is any change in this test with/without this patch. junbuml: We can add this test, but I don't think there is any change in this test with/without this…

Header2:		Header2:
%tobool2 = icmp eq i32 %p, 10		%tobool2 = icmp eq i32 %p, 10
br i1 %tobool2, label %Tail, label %TBB		br i1 %tobool2, label %Tail, label %TBB

TBB:		TBB:
%cmp = icmp ne i32 %v, 1		%cmp = icmp ne i32 %v, 1
br i1 %cmp, label %Tail, label %End		br i1 %cmp, label %Tail, label %End
Show All 31 Lines
End:		End:
ret i32 %v		ret i32 %v
}		}

;CHECK-LABEL: @test_ne_ne_ne_constrain_same_pointer_arg		;CHECK-LABEL: @test_ne_ne_ne_constrain_same_pointer_arg
;CHECK-LABEL: Header2.split:		;CHECK-LABEL: Header2.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 %p)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 %p)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 %v, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
define i32 @test_ne_ne_ne_constrain_same_pointer_arg(i32* %a, i32 %v, i32 %p, i32* %a2, i32* %a3) {		define i32 @test_ne_ne_ne_constrain_same_pointer_arg(i32* %a, i32 %v, i32 %p, i32* %a2, i32* %a3) {
junbumlUnsubmitted Not Done Reply Inline Actions We should keep this test to check that nonnull is passed to both call-sites. junbuml: We should keep this test to check that nonnull is passed to both call-sites.
Header:		Header:
%tobool1 = icmp ne i32* %a, null		%tobool1 = icmp ne i32* %a, null
br i1 %tobool1, label %Header2, label %End		br i1 %tobool1, label %Header2, label %TBB

Header2:		Header2:
%tobool2 = icmp ne i32* %a, %a2		%tobool2 = icmp ne i32* %a, %a2
br i1 %tobool2, label %Tail, label %TBB		br i1 %tobool2, label %Tail, label %TBB

TBB:		TBB:
%cmp = icmp ne i32* %a, %a3		%cmp = icmp ne i32* %a, %a3
br i1 %cmp, label %Tail, label %End		br i1 %cmp, label %Tail, label %End
Show All 33 Lines
End:		End:
ret i32 %v		ret i32 %v
}		}

;CHECK-LABEL: @test_eq_eq_eq_untaken		;CHECK-LABEL: @test_eq_eq_eq_untaken
;CHECK-LABEL: Header2.split:		;CHECK-LABEL: Header2.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 10)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 nonnull %a, i32 %v, i32 10)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 nonnull %a, i32 1, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 1, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
define i32 @test_eq_eq_eq_untaken(i32* %a, i32 %v, i32 %p) {		define i32 @test_eq_eq_eq_untaken(i32* %a, i32 %v, i32 %p) {
Header:		Header:
%tobool1 = icmp eq i32* %a, null		%tobool1 = icmp eq i32* %a, null
br i1 %tobool1, label %End, label %Header2		br i1 %tobool1, label %TBB, label %Header2

Header2:		Header2:
%tobool2 = icmp eq i32 %p, 10		%tobool2 = icmp eq i32 %p, 10
br i1 %tobool2, label %Tail, label %TBB		br i1 %tobool2, label %Tail, label %TBB

TBB:		TBB:
%cmp = icmp eq i32 %v, 1		%cmp = icmp eq i32 %v, 1
br i1 %cmp, label %Tail, label %End		br i1 %cmp, label %Tail, label %End
Show All 31 Lines
End:		End:
ret i32 %v		ret i32 %v
}		}

;CHECK-LABEL: @test_ne_eq_ne_untaken		;CHECK-LABEL: @test_ne_eq_ne_untaken
;CHECK-LABEL: Header2.split:		;CHECK-LABEL: Header2.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 null, i32 %v, i32 10)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 null, i32 %v, i32 10)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 null, i32 %v, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 %v, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header2.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
define i32 @test_ne_eq_ne_untaken(i32* %a, i32 %v, i32 %p) {		define i32 @test_ne_eq_ne_untaken(i32* %a, i32 %v, i32 %p) {
Header:		Header:
%tobool1 = icmp ne i32* %a, null		%tobool1 = icmp ne i32* %a, null
br i1 %tobool1, label %End, label %Header2		br i1 %tobool1, label %TBB, label %Header2

Header2:		Header2:
%tobool2 = icmp eq i32 %p, 10		%tobool2 = icmp eq i32 %p, 10
br i1 %tobool2, label %Tail, label %TBB		br i1 %tobool2, label %Tail, label %TBB

TBB:		TBB:
%cmp = icmp ne i32 %v, 1		%cmp = icmp ne i32 %v, 1
br i1 %cmp, label %Tail, label %End		br i1 %cmp, label %Tail, label %End
▲ Show 20 Lines • Show All 175 Lines • ▼ Show 20 Lines	Tail:
%p = phi i32[1,%Header], [2, %TBB]		%p = phi i32[1,%Header], [2, %TBB]
%r = call i32 @callee(i32* %a, i32 %v, i32 %p)		%r = call i32 @callee(i32* %a, i32 %v, i32 %p)
ret i32 %r		ret i32 %r

End:		End:
ret i32 %v		ret i32 %v
}		}

		;CHECK-LABEL: @test_cond_no_effect
		;CHECK-NOT: Header.split:
		;CHECK-NOT: TBB.split:
		;CHECK-LABEL: Tail:
		;CHECK: %r = call i32 @callee(i32* %a, i32 %v, i32 0)
		;CHECK: ret i32 %r
		define i32 @test_cond_no_effect(i32* %a, i32 %v) {
		Entry:
		%tobool1 = icmp eq i32* %a, null
		br i1 %tobool1, label %Header, label %End

		Header:
		br i1 undef, label %Tail, label %TBB

		TBB:
		br i1 undef, label %Tail, label %End

		Tail:
		%r = call i32 @callee(i32* %a, i32 %v, i32 0)
		ret i32 %r

		End:
		ret i32 %v
		}

;CHECK-LABEL: @test_unreachable		;CHECK-LABEL: @test_unreachable
;CHECK-LABEL: Header.split:		;CHECK-LABEL: Header.split:
;CHECK: %[[CALL1:.]] = call i32 @callee(i32 %a, i32 %v, i32 10)		;CHECK: %[[CALL1:.]] = call i32 @callee(i32 %a, i32 %v, i32 10)
;CHECK-LABEL: TBB.split:		;CHECK-LABEL: TBB.split:
;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 1, i32 %p)		;CHECK: %[[CALL2:.]] = call i32 @callee(i32 %a, i32 1, i32 %p)
;CHECK-LABEL: Tail		;CHECK-LABEL: Tail
;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header.split ], [ %[[CALL2]], %TBB.split ]		;CHECK: %[[MERGED:.*]] = phi i32 [ %[[CALL1]], %Header.split ], [ %[[CALL2]], %TBB.split ]
;CHECK: ret i32 %[[MERGED]]		;CHECK: ret i32 %[[MERGED]]
Show All 35 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[CallSiteSplitting] Only record conditions up to the IDom(call site).
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 138927

lib/Transforms/Scalar/CallSiteSplitting.cpp

test/Transforms/CallSiteSplitting/callsite-split-or-phi.ll

This is an archive of the discontinued LLVM Phabricator instance.

[CallSiteSplitting] Only record conditions up to the IDom(call site).ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 138927

lib/Transforms/Scalar/CallSiteSplitting.cpp

test/Transforms/CallSiteSplitting/callsite-split-or-phi.ll

[CallSiteSplitting] Only record conditions up to the IDom(call site).
ClosedPublic