Diff 278749

llvm/lib/Transforms/Utils/SimplifyCFG.cpp

Show First 20 Lines • Show All 1,985 Lines • ▼ Show 20 Lines	for (Instruction &CurI : reverse(BrBB->instructionsWithoutDebug())) {
}		}
}		}

return nullptr;		return nullptr;
}		}

/// Speculate a conditional basic block flattening the CFG.		/// Speculate a conditional basic block flattening the CFG.
///		///
/// Note that this is a very risky transform currently. Speculating		/// Note that this is a very risky transform currently. Speculating
		lebedev.riUnsubmitted Not Done Reply Inline Actions I do not understand what is going on in this function. Why are we comparing each separate cost with threshold, instead of accumulating the costs and comparing that? lebedev.ri: I do not understand what is going on in this function. Why are we comparing each separate cost…
		samparkerAuthorUnsubmitted Done Reply Inline Actions Hmm, I hadn't noticed that. Certainly happy to look into that next. samparker: Hmm, I hadn't noticed that. Certainly happy to look into that next.
/// instructions like this is most often not desirable. Instead, there is an MI		/// instructions like this is most often not desirable. Instead, there is an MI
/// pass which can do it with full awareness of the resource constraints.		/// pass which can do it with full awareness of the resource constraints.
/// However, some cases are "obvious" and we should do directly. An example of		/// However, some cases are "obvious" and we should do directly. An example of
/// this is speculating a single, reasonably cheap instruction.		/// this is speculating a single, reasonably cheap instruction.
///		///
/// There is only one distinct advantage to flattening the CFG at the IR level:		/// There is only one distinct advantage to flattening the CFG at the IR level:
/// it makes very common but simplistic optimizations such as are common in		/// it makes very common but simplistic optimizations such as are common in
/// instcombine and the DAG combiner more powerful by removing CFG edges and		/// instcombine and the DAG combiner more powerful by removing CFG edges and
/// modeling their effects with easier to reason about SSA value graphs.		/// modeling their effects with easier to reason about SSA value graphs.
///		///
///		///
/// An illustration of this transform is turning this IR:		/// An illustration of this transform is turning this IR:
/// \code		/// \code
/// BB:		/// BB:
/// %cmp = icmp ult %x, %y		/// %cmp = icmp ult %x, %y
/// br i1 %cmp, label %EndBB, label %ThenBB		/// br i1 %cmp, label %EndBB, label %ThenBB
/// ThenBB:		/// ThenBB:
/// %sub = sub %x, %y		/// %sub = sub %x, %y
/// br label BB2		/// br label BB2
/// EndBB:		/// EndBB:
/// %phi = phi [ %sub, %ThenBB ], [ 0, %EndBB ]		/// %phi = phi [ %sub, %ThenBB ], [ 0, %EndBB ]
/// ...		/// ...
		lebedev.riUnsubmitted Not Done Reply Inline Actions if (CostOfSelects > PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic) lebedev.ri: if (CostOfSelects > PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic)
/// \endcode		/// \endcode
///		///
/// Into this IR:		/// Into this IR:
/// \code		/// \code
/// BB:		/// BB:
/// %cmp = icmp ult %x, %y		/// %cmp = icmp ult %x, %y
/// %sub = sub %x, %y		/// %sub = sub %x, %y
/// %cond = select i1 %cmp, 0, %sub		/// %cond = select i1 %cmp, 0, %sub
/// ...		/// ...
/// \endcode		/// \endcode
///		///
/// \returns true if the conditional block is removed.		/// \returns true if the conditional block is removed.
bool SimplifyCFGOpt::SpeculativelyExecuteBB(BranchInst *BI, BasicBlock *ThenBB,		bool SimplifyCFGOpt::SpeculativelyExecuteBB(BranchInst *BI, BasicBlock *ThenBB,
const TargetTransformInfo &TTI) {		const TargetTransformInfo &TTI) {
// Be conservative for now. FP select instruction can often be expensive.		// Be conservative for now. FP select instruction can often be expensive.
Value *BrCond = BI->getCondition();		Value *BrCond = BI->getCondition();
if (isa<FCmpInst>(BrCond))		if (isa<FCmpInst>(BrCond))
return false;		return false;

BasicBlock *BB = BI->getParent();		BasicBlock *BB = BI->getParent();
BasicBlock *EndBB = ThenBB->getTerminator()->getSuccessor(0);		BasicBlock *EndBB = ThenBB->getTerminator()->getSuccessor(0);

		// Check how expensive it will be to insert the necessary selects.
		unsigned CostOfSelects = 0;
		for (PHINode &PN : EndBB->phis()) {
		unsigned OrigI = PN.getBasicBlockIndex(BB);
		unsigned ThenI = PN.getBasicBlockIndex(ThenBB);
		Value *OrigV = PN.getIncomingValue(OrigI);
		Value *ThenV = PN.getIncomingValue(ThenI);
		if (OrigV != ThenV)
		CostOfSelects +=
		TTI.getCmpSelInstrCost(Instruction::Select, PN.getType(), nullptr,
		TargetTransformInfo::TCK_SizeAndLatency);
		}
		if (CostOfSelects > PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic)
		return false;

// If ThenBB is actually on the false edge of the conditional branch, remember		// If ThenBB is actually on the false edge of the conditional branch, remember
// to swap the select operands later.		// to swap the select operands later.
bool Invert = false;		bool Invert = false;
if (ThenBB != BI->getSuccessor(0)) {		if (ThenBB != BI->getSuccessor(0)) {
assert(ThenBB == BI->getSuccessor(1) && "No edge from 'if' block?");		assert(ThenBB == BI->getSuccessor(1) && "No edge from 'if' block?");
Invert = true;		Invert = true;
}		}
assert(EndBB == BI->getSuccessor(!Invert) && "No edge from to end block");		assert(EndBB == BI->getSuccessor(!Invert) && "No edge from to end block");
Show All 27 Lines	if (SpeculatedInstructions > 1)
return false;		return false;

// Don't hoist the instruction if it's unsafe or expensive.		// Don't hoist the instruction if it's unsafe or expensive.
if (!isSafeToSpeculativelyExecute(I) &&		if (!isSafeToSpeculativelyExecute(I) &&
!(HoistCondStores && (SpeculatedStoreValue = isSafeToSpeculateStore(		!(HoistCondStores && (SpeculatedStoreValue = isSafeToSpeculateStore(
I, BB, ThenBB, EndBB))))		I, BB, ThenBB, EndBB))))
return false;		return false;
if (!SpeculatedStoreValue &&		if (!SpeculatedStoreValue &&
ComputeSpeculationCost(I, TTI) >		ComputeSpeculationCost(I, TTI) >
PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic)		PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic)
		lebedev.riUnsubmitted Not Done Reply Inline Actions here too lebedev.ri: here too
return false;		return false;

// Store the store speculation candidate.		// Store the store speculation candidate.
if (SpeculatedStoreValue)		if (SpeculatedStoreValue)
SpeculatedStore = cast<StoreInst>(I);		SpeculatedStore = cast<StoreInst>(I);

// Do not hoist the instruction if any of its operands are defined but not		// Do not hoist the instruction if any of its operands are defined but not
// used in BB. The transformation will prevent the operand from		// used in BB. The transformation will prevent the operand from
Show All 40 Lines	for (PHINode &PN : EndBB->phis()) {
ConstantExpr *OrigCE = dyn_cast<ConstantExpr>(OrigV);		ConstantExpr *OrigCE = dyn_cast<ConstantExpr>(OrigV);
ConstantExpr *ThenCE = dyn_cast<ConstantExpr>(ThenV);		ConstantExpr *ThenCE = dyn_cast<ConstantExpr>(ThenV);
if (!OrigCE && !ThenCE)		if (!OrigCE && !ThenCE)
continue; // Known safe and cheap.		continue; // Known safe and cheap.

if ((ThenCE && !isSafeToSpeculativelyExecute(ThenCE)) ||		if ((ThenCE && !isSafeToSpeculativelyExecute(ThenCE)) ||
(OrigCE && !isSafeToSpeculativelyExecute(OrigCE)))		(OrigCE && !isSafeToSpeculativelyExecute(OrigCE)))
return false;		return false;
unsigned OrigCost = OrigCE ? ComputeSpeculationCost(OrigCE, TTI) : 0;		unsigned OrigCost = OrigCE ? ComputeSpeculationCost(OrigCE, TTI) : 0;
unsigned ThenCost = ThenCE ? ComputeSpeculationCost(ThenCE, TTI) : 0;		unsigned ThenCost = ThenCE ? ComputeSpeculationCost(ThenCE, TTI) : 0;
unsigned MaxCost =		unsigned MaxCost =
2 * PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic;		2 * PHINodeFoldingThreshold * TargetTransformInfo::TCC_Basic;
if (OrigCost + ThenCost > MaxCost)		if (OrigCost + ThenCost > MaxCost)
return false;		return false;
		lebedev.riUnsubmitted Not Done Reply Inline Actions and here lebedev.ri: and here

// Account for the cost of an unfolded ConstantExpr which could end up		// Account for the cost of an unfolded ConstantExpr which could end up
// getting expanded into Instructions.		// getting expanded into Instructions.
// FIXME: This doesn't account for how many operations are combined in the		// FIXME: This doesn't account for how many operations are combined in the
// constant expression.		// constant expression.
++SpeculatedInstructions;		++SpeculatedInstructions;
if (SpeculatedInstructions > 1)		if (SpeculatedInstructions > 1)
return false;		return false;
▲ Show 20 Lines • Show All 4,131 Lines • Show Last 20 Lines

llvm/test/Transforms/SimplifyCFG/ARM/select-costs.ll

; NOTE: Assertions have been autogenerated by utils/update_test_checks.py		; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
		mkazantsevUnsubmitted Not Done Reply Inline Actions I also don't quite get what this is about. I'd suggest the following: Check in this test as is, without review, with current auto-generated checks; Diff in patch will show what changed. mkazantsev: I also don't quite get what this is about. I'd suggest the following: - Check in this test as…
; RUN: opt -mtriple=thumbv8.1m.main -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M		; RUN: opt -mtriple=thumbv8.1m.main -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M
; RUN: opt -mtriple=thumbv8m.main -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M		; RUN: opt -mtriple=thumbv8m.main -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M
; RUN: opt -mtriple=thumbv8m.base -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M		; RUN: opt -mtriple=thumbv8m.base -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8M
		fhahnUnsubmitted Not Done Reply Inline Actions I think it would be good to also add a triple for which we hoist the code, to ensure the test keeps testing what we want. fhahn: I think it would be good to also add a triple for which we hoist the code, to ensure the test…
; RUN: opt -mtriple=armv8a -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8A		; RUN: opt -mtriple=armv8a -simplifycfg -S %s -o - | FileCheck %s --check-prefix=V8A

; Test that the phis from for.inc.preheader aren't hoisted into sw.bb92 because		; Test that the phis from for.inc.preheader aren't hoisted into sw.bb92 because
; the cost is too great - we can make a better decision later on.		; the cost is too great - we can make a better decision later on.
define i32 @multiple_spec_select_costs(i8* %a, i32* %idx, i8 %in) {		define i32 @multiple_spec_select_costs(i8* %a, i32* %idx, i8 %in) {
; V8M-LABEL: @multiple_spec_select_costs(		; V8M-LABEL: @multiple_spec_select_costs(
; V8M-NEXT: entry:		; V8M-NEXT: entry:
; V8M-NEXT: [[GEP_A_2:%.*]] = getelementptr inbounds i8, i8* [[A:%.*]], i32 2		; V8M-NEXT: [[GEP_A_2:%.*]] = getelementptr inbounds i8, i8* [[A:%.*]], i32 2
; V8M-NEXT: [[INCDEC_PTR109_C4:%.*]] = getelementptr inbounds i8, i8* [[A]], i32 3		; V8M-NEXT: [[INCDEC_PTR109_C4:%.*]] = getelementptr inbounds i8, i8* [[A]], i32 3
; V8M-NEXT: [[ZERO:%.*]] = icmp ne i8 [[IN:%.*]], 0		; V8M-NEXT: [[ZERO:%.*]] = icmp ne i8 [[IN:%.*]], 0
; V8M-NEXT: br i1 [[ZERO]], label [[FOR_INC_PREHEADER:%.*]], label [[SW_BB92:%.*]]		; V8M-NEXT: br i1 [[ZERO]], label [[FOR_INC_PREHEADER:%.*]], label [[SW_BB92:%.*]]
; V8M: sw.bb92:		; V8M: sw.bb92:
; V8M-NEXT: [[C_OFF_I150:%.*]] = add i8 [[IN]], -48		; V8M-NEXT: [[C_OFF_I150:%.*]] = add i8 [[IN]], -48
; V8M-NEXT: [[UGT_9:%.*]] = icmp ugt i8 [[C_OFF_I150]], 9		; V8M-NEXT: [[UGT_9:%.*]] = icmp ugt i8 [[C_OFF_I150]], 9
; V8M-NEXT: [[SPEC_SELECT:%.*]] = select i1 [[UGT_9]], i1 false, i1 true		; V8M-NEXT: br i1 [[UGT_9]], label [[FOR_INC_PREHEADER]], label [[SELECT_UNFOLD198:%.*]]
; V8M-NEXT: [[SPEC_SELECT1:%.*]] = select i1 [[UGT_9]], i32 1, i32 7		; V8M: select.unfold198:
; V8M-NEXT: br label [[FOR_INC_PREHEADER]]		; V8M-NEXT: br label [[FOR_INC_PREHEADER]]
; V8M: for.inc.preheader:		; V8M: for.inc.preheader:
; V8M-NEXT: [[STR_PH_0:%.*]] = phi i8* [ [[GEP_A_2]], [[ENTRY:%.*]] ], [ [[INCDEC_PTR109_C4]], [[SW_BB92]] ]		; V8M-NEXT: [[STR_PH_0:%.*]] = phi i8* [ [[INCDEC_PTR109_C4]], [[SELECT_UNFOLD198]] ], [ [[INCDEC_PTR109_C4]], [[SW_BB92]] ], [ [[GEP_A_2]], [[ENTRY:%.*]] ]
; V8M-NEXT: [[CMP:%.*]] = phi i1 [ false, [[ENTRY]] ], [ [[SPEC_SELECT]], [[SW_BB92]] ]		; V8M-NEXT: [[CMP:%.*]] = phi i1 [ true, [[SELECT_UNFOLD198]] ], [ false, [[SW_BB92]] ], [ false, [[ENTRY]] ]
; V8M-NEXT: [[PHI_RES:%.*]] = phi i32 [ 1, [[ENTRY]] ], [ [[SPEC_SELECT1]], [[SW_BB92]] ]		; V8M-NEXT: [[PHI_RES:%.*]] = phi i32 [ 7, [[SELECT_UNFOLD198]] ], [ 1, [[SW_BB92]] ], [ 1, [[ENTRY]] ]
; V8M-NEXT: br label [[FOR_INC:%.*]]		; V8M-NEXT: br label [[FOR_INC:%.*]]
; V8M: for.inc:		; V8M: for.inc:
; V8M-NEXT: [[STR_PH_1:%.*]] = phi i8* [ [[INCDEC_PTR109:%.*]], [[FOR_BODY:%.*]] ], [ [[STR_PH_0]], [[FOR_INC_PREHEADER]] ]		; V8M-NEXT: [[STR_PH_1:%.*]] = phi i8* [ [[INCDEC_PTR109:%.*]], [[FOR_BODY:%.*]] ], [ [[STR_PH_0]], [[FOR_INC_PREHEADER]] ]
; V8M-NEXT: [[INCDEC_PTR109]] = getelementptr inbounds i8, i8* [[STR_PH_1]], i32 1		; V8M-NEXT: [[INCDEC_PTR109]] = getelementptr inbounds i8, i8* [[STR_PH_1]], i32 1
; V8M-NEXT: [[LOAD_1:%.*]] = load i8, i8* [[INCDEC_PTR109]], align 1		; V8M-NEXT: [[LOAD_1:%.*]] = load i8, i8* [[INCDEC_PTR109]], align 1
; V8M-NEXT: [[TOBOOL:%.*]] = icmp ne i8 [[LOAD_1]], 0		; V8M-NEXT: [[TOBOOL:%.*]] = icmp ne i8 [[LOAD_1]], 0
; V8M-NEXT: [[AND:%.*]] = and i1 [[CMP]], [[TOBOOL]]		; V8M-NEXT: [[AND:%.*]] = and i1 [[CMP]], [[TOBOOL]]
; V8M-NEXT: br i1 [[AND]], label [[FOR_BODY]], label [[EXIT:%.*]]		; V8M-NEXT: br i1 [[AND]], label [[FOR_BODY]], label [[EXIT:%.*]]
▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines	sw.bb92:
br i1 %ugt.9, label %for.inc.preheader, label %select.unfold198		br i1 %ugt.9, label %for.inc.preheader, label %select.unfold198

select.unfold198:		select.unfold198:
br label %for.inc.preheader		br label %for.inc.preheader

for.inc.preheader:		for.inc.preheader:
%str.ph.0 = phi i8* [ %incdec.ptr109.c4, %select.unfold198 ], [ %incdec.ptr109.c4, %sw.bb92 ], [ %gep.a.2, %entry ]		%str.ph.0 = phi i8* [ %incdec.ptr109.c4, %select.unfold198 ], [ %incdec.ptr109.c4, %sw.bb92 ], [ %gep.a.2, %entry ]
%cmp = phi i1 [ true, %select.unfold198 ], [ false, %sw.bb92 ], [ false, %entry ]		%cmp = phi i1 [ true, %select.unfold198 ], [ false, %sw.bb92 ], [ false, %entry ]
%phi.res = phi i32 [ 7, %select.unfold198 ], [ 1, %sw.bb92 ], [ 1, %entry ]		%phi.res = phi i32 [ 7, %select.unfold198 ], [ 1, %sw.bb92 ], [ 1, %entry ]
		RKSimonUnsubmitted Not Done Reply Inline Actions Can you cleanup/reduce this test case any further? RKSimon: Can you cleanup/reduce this test case any further?
br label %for.inc		br label %for.inc

for.inc:		for.inc:
%str.ph.1 = phi i8* [ %incdec.ptr109, %for.body ], [ %str.ph.0, %for.inc.preheader ]		%str.ph.1 = phi i8* [ %incdec.ptr109, %for.body ], [ %str.ph.0, %for.inc.preheader ]
%incdec.ptr109 = getelementptr inbounds i8, i8* %str.ph.1, i32 1		%incdec.ptr109 = getelementptr inbounds i8, i8* %str.ph.1, i32 1
%load.1 = load i8, i8* %incdec.ptr109, align 1		%load.1 = load i8, i8* %incdec.ptr109, align 1
%tobool = icmp ne i8 %load.1, 0		%tobool = icmp ne i8 %load.1, 0
%and = and i1 %cmp, %tobool		%and = and i1 %cmp, %tobool
Show All 10 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[SimplifyCFG] Cost required selects
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 278749

llvm/lib/Transforms/Utils/SimplifyCFG.cpp

llvm/test/Transforms/SimplifyCFG/ARM/select-costs.ll

This is an archive of the discontinued LLVM Phabricator instance.

[SimplifyCFG] Cost required selectsClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 278749

llvm/lib/Transforms/Utils/SimplifyCFG.cpp

llvm/test/Transforms/SimplifyCFG/ARM/select-costs.ll

[SimplifyCFG] Cost required selects
ClosedPublic