Diff 532563

llvm/lib/CodeGen/CodeGenPrepare.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 298 Lines • ▼ Show 20 Lines
class CodeGenPrepare : public FunctionPass {		class CodeGenPrepare : public FunctionPass {
const TargetMachine *TM = nullptr;		const TargetMachine *TM = nullptr;
const TargetSubtargetInfo *SubtargetInfo = nullptr;		const TargetSubtargetInfo *SubtargetInfo = nullptr;
const TargetLowering *TLI = nullptr;		const TargetLowering *TLI = nullptr;
const TargetRegisterInfo *TRI = nullptr;		const TargetRegisterInfo *TRI = nullptr;
const TargetTransformInfo *TTI = nullptr;		const TargetTransformInfo *TTI = nullptr;
const BasicBlockSectionsProfileReader *BBSectionsProfileReader = nullptr;		const BasicBlockSectionsProfileReader *BBSectionsProfileReader = nullptr;
const TargetLibraryInfo *TLInfo = nullptr;		const TargetLibraryInfo *TLInfo = nullptr;
const LoopInfo *LI = nullptr;		LoopInfo *LI = nullptr;
std::unique_ptr<BlockFrequencyInfo> BFI;		std::unique_ptr<BlockFrequencyInfo> BFI;
std::unique_ptr<BranchProbabilityInfo> BPI;		std::unique_ptr<BranchProbabilityInfo> BPI;
ProfileSummaryInfo *PSI = nullptr;		ProfileSummaryInfo *PSI = nullptr;

/// As we scan instructions optimizing them, this is the next instruction		/// As we scan instructions optimizing them, this is the next instruction
/// to optimize. Transforms that can invalidate this should update it.		/// to optimize. Transforms that can invalidate this should update it.
BasicBlock::iterator CurInstIterator;		BasicBlock::iterator CurInstIterator;

▲ Show 20 Lines • Show All 96 Lines • ▼ Show 20 Lines	private:
DominatorTree &getDT(Function &F) {		DominatorTree &getDT(Function &F) {
if (!DT)		if (!DT)
DT = std::make_unique<DominatorTree>(F);		DT = std::make_unique<DominatorTree>(F);
return *DT;		return *DT;
}		}

void removeAllAssertingVHReferences(Value *V);		void removeAllAssertingVHReferences(Value *V);
bool eliminateAssumptions(Function &F);		bool eliminateAssumptions(Function &F);
bool eliminateFallThrough(Function &F);		bool eliminateFallThrough(Function &F, DominatorTree *DT = nullptr);
bool eliminateMostlyEmptyBlocks(Function &F);		bool eliminateMostlyEmptyBlocks(Function &F);
BasicBlock findDestBlockOfMergeableEmptyBlock(BasicBlock BB);		BasicBlock findDestBlockOfMergeableEmptyBlock(BasicBlock BB);
bool canMergeBlocks(const BasicBlock BB, const BasicBlock DestBB) const;		bool canMergeBlocks(const BasicBlock BB, const BasicBlock DestBB) const;
void eliminateMostlyEmptyBlock(BasicBlock *BB);		void eliminateMostlyEmptyBlock(BasicBlock *BB);
bool isMergingEmptyBlockProfitable(BasicBlock BB, BasicBlock DestBB,		bool isMergingEmptyBlockProfitable(BasicBlock BB, BasicBlock DestBB,
bool isPreheader);		bool isPreheader);
bool makeBitReverse(Instruction &I);		bool makeBitReverse(Instruction &I);
bool optimizeBlock(BasicBlock &BB, ModifyDT &ModifiedDT);		bool optimizeBlock(BasicBlock &BB, ModifyDT &ModifiedDT);
▲ Show 20 Lines • Show All 144 Lines • ▼ Show 20 Lines	bool CodeGenPrepare::runOnFunction(Function &F) {
// to help generate sane code for PHIs involving such edges.		// to help generate sane code for PHIs involving such edges.
EverMadeChange \|=		EverMadeChange \|=
SplitIndirectBrCriticalEdges(F, /IgnoreBlocksWithoutPHI=/true);		SplitIndirectBrCriticalEdges(F, /IgnoreBlocksWithoutPHI=/true);

// If we are optimzing huge function, we need to consider the build time.		// If we are optimzing huge function, we need to consider the build time.
// Because the basic algorithm's complex is near O(N!).		// Because the basic algorithm's complex is near O(N!).
IsHugeFunc = F.size() > HugeFuncThresholdInCGPP;		IsHugeFunc = F.size() > HugeFuncThresholdInCGPP;

		// Transformations above may invalidate dominator tree and/or loop info.
		DT.reset();
		LI->releaseMemory();
		LI->analyze(getDT(F));

bool MadeChange = true;		bool MadeChange = true;
bool FuncIterated = false;		bool FuncIterated = false;
while (MadeChange) {		while (MadeChange) {
MadeChange = false;		MadeChange = false;
DT.reset();

for (BasicBlock &BB : llvm::make_early_inc_range(F)) {		for (BasicBlock &BB : llvm::make_early_inc_range(F)) {
if (FuncIterated && !FreshBBs.contains(&BB))		if (FuncIterated && !FreshBBs.contains(&BB))
continue;		continue;

		efriedma (inline comment, done): Doing this for every basic block is going to get way too expensive, even for something labeled "expensive".
ModifyDT ModifiedDTOnIteration = ModifyDT::NotModifyDT;		ModifyDT ModifiedDTOnIteration = ModifyDT::NotModifyDT;
bool Changed = optimizeBlock(BB, ModifiedDTOnIteration);		bool Changed = optimizeBlock(BB, ModifiedDTOnIteration);

		if (ModifiedDTOnIteration == ModifyDT::ModifyBBDT)
		DT.reset();

MadeChange \|= Changed;		MadeChange \|= Changed;
if (IsHugeFunc) {		if (IsHugeFunc) {
// If the BB is updated, it may still has chance to be optimized.		// If the BB is updated, it may still has chance to be optimized.
// This usually happen at sink optimization.		// This usually happen at sink optimization.
// For example:		// For example:
//		//
// bb0：		// bb0：
// %and = and i32 %a, 4		// %and = and i32 %a, 4
// %cmp = icmp eq i32 %and, 0		// %cmp = icmp eq i32 %and, 0
//		//
// If the %cmp sink to other BB, the %and will has chance to sink.		// If the %cmp sink to other BB, the %and will has chance to sink.
if (Changed)		if (Changed)
FreshBBs.insert(&BB);		FreshBBs.insert(&BB);
else if (FuncIterated)		else if (FuncIterated)
FreshBBs.erase(&BB);		FreshBBs.erase(&BB);

if (ModifiedDTOnIteration == ModifyDT::ModifyBBDT)
DT.reset();
} else {		} else {
// For small/normal functions, we restart BB iteration if the dominator		// For small/normal functions, we restart BB iteration if the dominator
// tree of the Function was changed.		// tree of the Function was changed.
if (ModifiedDTOnIteration != ModifyDT::NotModifyDT)		if (ModifiedDTOnIteration != ModifyDT::NotModifyDT)
break;		break;
}		}
}		}
// We have iterated all the BB in the (only work for huge) function.		// We have iterated all the BB in the (only work for huge) function.
FuncIterated = IsHugeFunc;		FuncIterated = IsHugeFunc;

if (EnableTypePromotionMerge && !ValToSExtendedUses.empty())		if (EnableTypePromotionMerge && !ValToSExtendedUses.empty())
MadeChange \|= mergeSExts(F);		MadeChange \|= mergeSExts(F);
if (!LargeOffsetGEPMap.empty())		if (!LargeOffsetGEPMap.empty())
MadeChange \|= splitLargeGEPOffsets();		MadeChange \|= splitLargeGEPOffsets();
MadeChange \|= optimizePhiTypes(F);		MadeChange \|= optimizePhiTypes(F);

if (MadeChange)		if (MadeChange)
eliminateFallThrough(F);		eliminateFallThrough(F, DT.get());

		#ifndef NDEBUG
		if (MadeChange && VerifyLoopInfo)
		efriedma (inline comment, done): Weird indentation.
		LI->verify(getDT(F));
		#endif

// Really free removed instructions during promotion.		// Really free removed instructions during promotion.
for (Instruction *I : RemovedInsts)		for (Instruction *I : RemovedInsts)
I->deleteValue();		I->deleteValue();

EverMadeChange \|= MadeChange;		EverMadeChange \|= MadeChange;
SeenChainsForSExt.clear();		SeenChainsForSExt.clear();
ValToSExtendedUses.clear();		ValToSExtendedUses.clear();
RemovedInsts.clear();		RemovedInsts.clear();
LargeOffsetGEPMap.clear();		LargeOffsetGEPMap.clear();
LargeOffsetGEPID.clear();		LargeOffsetGEPID.clear();
}		}

NewGEPBases.clear();		NewGEPBases.clear();
SunkAddrs.clear();		SunkAddrs.clear();

if (!DisableBranchOpts) {		if (!DisableBranchOpts) {
MadeChange = false;		MadeChange = false;
// Use a set vector to get deterministic iteration order. The order the		// Use a set vector to get deterministic iteration order. The order the
// blocks are removed may affect whether or not PHI nodes in successors		// blocks are removed may affect whether or not PHI nodes in successors
// are removed.		// are removed.
		efriedma (inline comment, done): Given the way the code is structured, isn't this always running just after you've called releaseMemory()/analyze() on LI?
		chill (author, inline reply, done): D'oh, indeed: once we exit the loop because `MadeChange` is `false`, it means none of the code after `LI->analyze` did anything, including changing the loop structure.
SmallSetVector<BasicBlock *, 8> WorkList;		SmallSetVector<BasicBlock *, 8> WorkList;
for (BasicBlock &BB : F) {		for (BasicBlock &BB : F) {
SmallVector<BasicBlock *, 2> Successors(successors(&BB));		SmallVector<BasicBlock *, 2> Successors(successors(&BB));
MadeChange \|= ConstantFoldTerminator(&BB, true);		MadeChange \|= ConstantFoldTerminator(&BB, true);
if (!MadeChange)		if (!MadeChange)
continue;		continue;

for (BasicBlock *Succ : Successors)		for (BasicBlock *Succ : Successors)
▲ Show 20 Lines • Show All 95 Lines • ▼ Show 20 Lines	void LLVM_ATTRIBUTE_UNUSED CodeGenPrepare::verifyBFIUpdates(Function &F) {
BranchProbabilityInfo NewBPI(F, NewLI, TLInfo);		BranchProbabilityInfo NewBPI(F, NewLI, TLInfo);
BlockFrequencyInfo NewBFI(F, NewBPI, NewLI);		BlockFrequencyInfo NewBFI(F, NewBPI, NewLI);
NewBFI.verifyMatch(*BFI);		NewBFI.verifyMatch(*BFI);
}		}

/// Merge basic blocks which are connected by a single edge, where one of the		/// Merge basic blocks which are connected by a single edge, where one of the
/// basic blocks has a single successor pointing to the other basic block,		/// basic blocks has a single successor pointing to the other basic block,
/// which has a single predecessor.		/// which has a single predecessor.
bool CodeGenPrepare::eliminateFallThrough(Function &F) {		bool CodeGenPrepare::eliminateFallThrough(Function &F, DominatorTree *DT) {
bool Changed = false;		bool Changed = false;
// Scan all of the blocks in the function, except for the entry block.		// Scan all of the blocks in the function, except for the entry block.
// Use a temporary array to avoid iterator being invalidated when		// Use a temporary array to avoid iterator being invalidated when
// deleting blocks.		// deleting blocks.
SmallVector<WeakTrackingVH, 16> Blocks;		SmallVector<WeakTrackingVH, 16> Blocks;
for (auto &Block : llvm::drop_begin(F))		for (auto &Block : llvm::drop_begin(F))
Blocks.push_back(&Block);		Blocks.push_back(&Block);

SmallSet<WeakTrackingVH, 16> Preds;		SmallSet<WeakTrackingVH, 16> Preds;
for (auto &Block : Blocks) {		for (auto &Block : Blocks) {
auto *BB = cast_or_null<BasicBlock>(Block);		auto *BB = cast_or_null<BasicBlock>(Block);
if (!BB)		if (!BB)
continue;		continue;
// If the destination block has a single pred, then this is a trivial		// If the destination block has a single pred, then this is a trivial
// edge, just collapse it.		// edge, just collapse it.
BasicBlock *SinglePred = BB->getSinglePredecessor();		BasicBlock *SinglePred = BB->getSinglePredecessor();

// Don't merge if BB's address is taken.		// Don't merge if BB's address is taken.
if (!SinglePred \|\| SinglePred == BB \|\| BB->hasAddressTaken())		if (!SinglePred \|\| SinglePred == BB \|\| BB->hasAddressTaken())
continue;		continue;

		// Make an effort to skip unreachable blocks.
		if (DT && !DT->isReachableFromEntry(BB))
		continue;

BranchInst *Term = dyn_cast<BranchInst>(SinglePred->getTerminator());		BranchInst *Term = dyn_cast<BranchInst>(SinglePred->getTerminator());
if (Term && !Term->isConditional()) {		if (Term && !Term->isConditional()) {
Changed = true;		Changed = true;
LLVM_DEBUG(dbgs() << "To merge:\n" << *BB << "\n\n\n");		LLVM_DEBUG(dbgs() << "To merge:\n" << *BB << "\n\n\n");

// Merge BB into SinglePred and delete it.		// Merge BB into SinglePred and delete it.
MergeBlockIntoPredecessor(BB);		MergeBlockIntoPredecessor(BB, /* DTU / nullptr, LI, / MSSAU */ nullptr,
		/* MemDep */ nullptr,
		/* PredecessorWithTwoSuccessors */ false, DT);
Preds.insert(SinglePred);		Preds.insert(SinglePred);

if (IsHugeFunc) {		if (IsHugeFunc) {
// Update FreshBBs to optimize the merged BB.		// Update FreshBBs to optimize the merged BB.
FreshBBs.insert(SinglePred);		FreshBBs.insert(SinglePred);
FreshBBs.erase(BB);		FreshBBs.erase(BB);
}		}
}		}
▲ Show 20 Lines • Show All 1,365 Lines • ▼ Show 20 Lines
/// cond.false:		/// cond.false:
/// %z = call i64 @llvm.cttz.i64(i64 %A, i1 true)		/// %z = call i64 @llvm.cttz.i64(i64 %A, i1 true)
/// br label %cond.end		/// br label %cond.end
/// cond.end:		/// cond.end:
/// %ctz = phi i64 [ 64, %entry ], [ %z, %cond.false ]		/// %ctz = phi i64 [ 64, %entry ], [ %z, %cond.false ]
///		///
/// If the transform is performed, return true and set ModifiedDT to true.		/// If the transform is performed, return true and set ModifiedDT to true.
static bool despeculateCountZeros(IntrinsicInst *CountZeros,		static bool despeculateCountZeros(IntrinsicInst *CountZeros,
		LoopInfo &LI,
const TargetLowering *TLI,		const TargetLowering *TLI,
const DataLayout *DL, ModifyDT &ModifiedDT,		const DataLayout *DL, ModifyDT &ModifiedDT,
SmallSet<BasicBlock *, 32> &FreshBBs,		SmallSet<BasicBlock *, 32> &FreshBBs,
bool IsHugeFunc) {		bool IsHugeFunc) {
// If a zero input is undefined, it doesn't make sense to despeculate that.		// If a zero input is undefined, it doesn't make sense to despeculate that.
if (match(CountZeros->getOperand(1), m_One()))		if (match(CountZeros->getOperand(1), m_One()))
return false;		return false;

Show All 23 Lines	static bool despeculateCountZeros(IntrinsicInst *CountZeros,
// Create another block after the count zero intrinsic. A PHI will be added		// Create another block after the count zero intrinsic. A PHI will be added
// in this block to select the result of the intrinsic or the bit-width		// in this block to select the result of the intrinsic or the bit-width
// constant if the input to the intrinsic is zero.		// constant if the input to the intrinsic is zero.
BasicBlock::iterator SplitPt = ++(BasicBlock::iterator(CountZeros));		BasicBlock::iterator SplitPt = ++(BasicBlock::iterator(CountZeros));
BasicBlock *EndBlock = CallBlock->splitBasicBlock(SplitPt, "cond.end");		BasicBlock *EndBlock = CallBlock->splitBasicBlock(SplitPt, "cond.end");
if (IsHugeFunc)		if (IsHugeFunc)
FreshBBs.insert(EndBlock);		FreshBBs.insert(EndBlock);

		// Update the LoopInfo. The new blocks are in the same loop as the start
		// block.
		if (Loop *L = LI.getLoopFor(StartBlock)) {
		L->addBasicBlockToLoop(CallBlock, LI);
		efriedma (inline comment, done): Wrong indentation.
		L->addBasicBlockToLoop(EndBlock, LI);
		}

// Set up a builder to create a compare, conditional branch, and PHI.		// Set up a builder to create a compare, conditional branch, and PHI.
IRBuilder<> Builder(CountZeros->getContext());		IRBuilder<> Builder(CountZeros->getContext());
Builder.SetInsertPoint(StartBlock->getTerminator());		Builder.SetInsertPoint(StartBlock->getTerminator());
Builder.SetCurrentDebugLocation(CountZeros->getDebugLoc());		Builder.SetCurrentDebugLocation(CountZeros->getDebugLoc());

// Replace the unconditional branch that was created by the first split with		// Replace the unconditional branch that was created by the first split with
// a compare against zero and a conditional branch.		// a compare against zero and a conditional branch.
Value *Zero = Constant::getNullValue(Ty);		Value *Zero = Constant::getNullValue(Ty);
▲ Show 20 Lines • Show All 158 Lines • ▼ Show 20 Lines	case Intrinsic::strip_invariant_group: {

replaceAllUsesWith(II, ArgVal, FreshBBs, IsHugeFunc);		replaceAllUsesWith(II, ArgVal, FreshBBs, IsHugeFunc);
II->eraseFromParent();		II->eraseFromParent();
return true;		return true;
}		}
case Intrinsic::cttz:		case Intrinsic::cttz:
case Intrinsic::ctlz:		case Intrinsic::ctlz:
// If counting zeros is expensive, try to avoid it.		// If counting zeros is expensive, try to avoid it.
return despeculateCountZeros(II, TLI, DL, ModifiedDT, FreshBBs,		return despeculateCountZeros(II, *LI, TLI, DL, ModifiedDT, FreshBBs,
IsHugeFunc);		IsHugeFunc);
case Intrinsic::fshl:		case Intrinsic::fshl:
case Intrinsic::fshr:		case Intrinsic::fshr:
return optimizeFunnelShift(II);		return optimizeFunnelShift(II);
case Intrinsic::dbg_assign:		case Intrinsic::dbg_assign:
case Intrinsic::dbg_value:		case Intrinsic::dbg_value:
return fixupDbgValue(II);		return fixupDbgValue(II);
case Intrinsic::masked_gather:		case Intrinsic::masked_gather:
▲ Show 20 Lines • Show All 66 Lines • ▼ Show 20 Lines	bool CodeGenPrepare::dupRetToEnableTailCallOpts(BasicBlock *BB,
ModifyDT &ModifiedDT) {		ModifyDT &ModifiedDT) {
if (!BB->getTerminator())		if (!BB->getTerminator())
return false;		return false;

ReturnInst *RetI = dyn_cast<ReturnInst>(BB->getTerminator());		ReturnInst *RetI = dyn_cast<ReturnInst>(BB->getTerminator());
if (!RetI)		if (!RetI)
return false;		return false;

		assert(LI->getLoopFor(BB) == nullptr && "A return block cannot be in a loop");

PHINode *PN = nullptr;		PHINode *PN = nullptr;
ExtractValueInst *EVI = nullptr;		ExtractValueInst *EVI = nullptr;
BitCastInst *BCI = nullptr;		BitCastInst *BCI = nullptr;
Value *V = RetI->getReturnValue();		Value *V = RetI->getReturnValue();
if (V) {		if (V) {
BCI = dyn_cast<BitCastInst>(V);		BCI = dyn_cast<BitCastInst>(V);
if (BCI)		if (BCI)
V = BCI->getOperand(0);		V = BCI->getOperand(0);
▲ Show 20 Lines • Show All 3,635 Lines • ▼ Show 20 Lines	while (LargeOffsetGEP != LargeOffsetGEPs.end()) {
if (auto *BaseI = dyn_cast<Instruction>(OldBase)) {		if (auto *BaseI = dyn_cast<Instruction>(OldBase)) {
// If the base of the struct is an instruction, the new base will be		// If the base of the struct is an instruction, the new base will be
// inserted close to it.		// inserted close to it.
NewBaseInsertBB = BaseI->getParent();		NewBaseInsertBB = BaseI->getParent();
if (isa<PHINode>(BaseI))		if (isa<PHINode>(BaseI))
NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();		NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();
else if (InvokeInst *Invoke = dyn_cast<InvokeInst>(BaseI)) {		else if (InvokeInst *Invoke = dyn_cast<InvokeInst>(BaseI)) {
NewBaseInsertBB =		NewBaseInsertBB =
SplitEdge(NewBaseInsertBB, Invoke->getNormalDest());		SplitEdge(NewBaseInsertBB, Invoke->getNormalDest(), DT.get(), LI);
NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();		NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();
} else		} else
NewBaseInsertPt = std::next(BaseI->getIterator());		NewBaseInsertPt = std::next(BaseI->getIterator());
} else {		} else {
// If the current base is an argument or global value, the new base		// If the current base is an argument or global value, the new base
// will be inserted to the entry block.		// will be inserted to the entry block.
NewBaseInsertBB = &BaseGEP->getFunction()->getEntryBlock();		NewBaseInsertBB = &BaseGEP->getFunction()->getEntryBlock();
NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();		NewBaseInsertPt = NewBaseInsertBB->getFirstInsertionPt();
▲ Show 20 Lines • Show All 837 Lines • ▼ Show 20 Lines	bool CodeGenPrepare::optimizeSelectInst(SelectInst *SI) {
// If the true or false blocks do not contain a sunken instruction, that		// If the true or false blocks do not contain a sunken instruction, that
// block and its branch may be optimized away. In that case, one side of the		// block and its branch may be optimized away. In that case, one side of the
// first branch will point directly to select.end, and the corresponding PHI		// first branch will point directly to select.end, and the corresponding PHI
// predecessor block will be the start block.		// predecessor block will be the start block.

// First, we split the block containing the select into 2 blocks.		// First, we split the block containing the select into 2 blocks.
BasicBlock *StartBlock = SI->getParent();		BasicBlock *StartBlock = SI->getParent();
BasicBlock::iterator SplitPt = ++(BasicBlock::iterator(LastSI));		BasicBlock::iterator SplitPt = ++(BasicBlock::iterator(LastSI));
BasicBlock *EndBlock = StartBlock->splitBasicBlock(SplitPt, "select.end");		BasicBlock *EndBlock = StartBlock->splitBasicBlock(SplitPt, "select.end");
		efriedma (inline comment, not done): I think we have a SplitBasicBlock utility that handles DT/LI automatically, but I don't want to let any complex refactoring block this.
if (IsHugeFunc)		if (IsHugeFunc)
FreshBBs.insert(EndBlock);		FreshBBs.insert(EndBlock);
		Loop *L = LI->getLoopFor(StartBlock);
		if (L)
		L->addBasicBlockToLoop(EndBlock, *LI);
BFI->setBlockFreq(EndBlock, BFI->getBlockFreq(StartBlock).getFrequency());		BFI->setBlockFreq(EndBlock, BFI->getBlockFreq(StartBlock).getFrequency());

// Delete the unconditional branch that was just created by the split.		// Delete the unconditional branch that was just created by the split.
StartBlock->getTerminator()->eraseFromParent();		StartBlock->getTerminator()->eraseFromParent();

// These are the new basic blocks for the conditional branch.		// These are the new basic blocks for the conditional branch.
// At least one will become an actual new basic block.		// At least one will become an actual new basic block.
BasicBlock *TrueBlock = nullptr;		BasicBlock *TrueBlock = nullptr;
BasicBlock *FalseBlock = nullptr;		BasicBlock *FalseBlock = nullptr;
BranchInst *TrueBranch = nullptr;		BranchInst *TrueBranch = nullptr;
BranchInst *FalseBranch = nullptr;		BranchInst *FalseBranch = nullptr;

// Sink expensive instructions into the conditional blocks to avoid executing		// Sink expensive instructions into the conditional blocks to avoid executing
// them speculatively.		// them speculatively.
for (SelectInst *SI : ASI) {		for (SelectInst *SI : ASI) {
if (sinkSelectOperand(TTI, SI->getTrueValue())) {		if (sinkSelectOperand(TTI, SI->getTrueValue())) {
if (TrueBlock == nullptr) {		if (TrueBlock == nullptr) {
TrueBlock = BasicBlock::Create(SI->getContext(), "select.true.sink",		TrueBlock = BasicBlock::Create(SI->getContext(), "select.true.sink",
EndBlock->getParent(), EndBlock);		EndBlock->getParent(), EndBlock);
TrueBranch = BranchInst::Create(EndBlock, TrueBlock);		TrueBranch = BranchInst::Create(EndBlock, TrueBlock);
if (IsHugeFunc)		if (IsHugeFunc)
FreshBBs.insert(TrueBlock);		FreshBBs.insert(TrueBlock);
		if (L)
		L->addBasicBlockToLoop(TrueBlock, *LI);
TrueBranch->setDebugLoc(SI->getDebugLoc());		TrueBranch->setDebugLoc(SI->getDebugLoc());
}		}
auto *TrueInst = cast<Instruction>(SI->getTrueValue());		auto *TrueInst = cast<Instruction>(SI->getTrueValue());
TrueInst->moveBefore(TrueBranch);		TrueInst->moveBefore(TrueBranch);
}		}
if (sinkSelectOperand(TTI, SI->getFalseValue())) {		if (sinkSelectOperand(TTI, SI->getFalseValue())) {
if (FalseBlock == nullptr) {		if (FalseBlock == nullptr) {
FalseBlock = BasicBlock::Create(SI->getContext(), "select.false.sink",		FalseBlock = BasicBlock::Create(SI->getContext(), "select.false.sink",
EndBlock->getParent(), EndBlock);		EndBlock->getParent(), EndBlock);
if (IsHugeFunc)		if (IsHugeFunc)
FreshBBs.insert(FalseBlock);		FreshBBs.insert(FalseBlock);
		if (L)
		L->addBasicBlockToLoop(FalseBlock, *LI);
FalseBranch = BranchInst::Create(EndBlock, FalseBlock);		FalseBranch = BranchInst::Create(EndBlock, FalseBlock);
FalseBranch->setDebugLoc(SI->getDebugLoc());		FalseBranch->setDebugLoc(SI->getDebugLoc());
}		}
auto *FalseInst = cast<Instruction>(SI->getFalseValue());		auto *FalseInst = cast<Instruction>(SI->getFalseValue());
FalseInst->moveBefore(FalseBranch);		FalseInst->moveBefore(FalseBranch);
}		}
}		}

// If there was nothing to sink, then arbitrarily choose the 'false' side		// If there was nothing to sink, then arbitrarily choose the 'false' side
// for a new input value to the PHI.		// for a new input value to the PHI.
if (TrueBlock == FalseBlock) {		if (TrueBlock == FalseBlock) {
assert(TrueBlock == nullptr &&		assert(TrueBlock == nullptr &&
"Unexpected basic block transform while optimizing select");		"Unexpected basic block transform while optimizing select");

FalseBlock = BasicBlock::Create(SI->getContext(), "select.false",		FalseBlock = BasicBlock::Create(SI->getContext(), "select.false",
EndBlock->getParent(), EndBlock);		EndBlock->getParent(), EndBlock);
if (IsHugeFunc)		if (IsHugeFunc)
FreshBBs.insert(FalseBlock);		FreshBBs.insert(FalseBlock);
		if (L)
		L->addBasicBlockToLoop(FalseBlock, *LI);
auto *FalseBranch = BranchInst::Create(EndBlock, FalseBlock);		auto *FalseBranch = BranchInst::Create(EndBlock, FalseBlock);
FalseBranch->setDebugLoc(SI->getDebugLoc());		FalseBranch->setDebugLoc(SI->getDebugLoc());
}		}

// Insert the real conditional branch based on the original condition.		// Insert the real conditional branch based on the original condition.
// If we did not create a new block for one of the 'true' or 'false' paths		// If we did not create a new block for one of the 'true' or 'false' paths
// of the condition, it means that side of the branch goes to the end block		// of the condition, it means that side of the branch goes to the end block
// directly and the path originates from the start block from the point of		// directly and the path originates from the start block from the point of
▲ Show 20 Lines • Show All 1,596 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[CodeGenPrepare] Fix for using outdated/corrupt LoopInfo
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 532563

llvm/lib/CodeGen/CodeGenPrepare.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[CodeGenPrepare] Fix for using outdated/corrupt LoopInfo (Closed, Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 532563

llvm/lib/CodeGen/CodeGenPrepare.cpp

[CodeGenPrepare] Fix for using outdated/corrupt LoopInfo
ClosedPublic