This is an archive of the discontinued LLVM Phabricator instance.

[LICM/mustexec] Extend first iteration must execute logic to fcmps
ClosedPublic

Authored by reames on Mar 15 2018, 2:22 PM.

Download Raw Diff

Details

Reviewers

Commits

rG8a106272e889: [LICM/mustexec] Extend first iteration must execute logic to fcmps
rL327722: [LICM/mustexec] Extend first iteration must execute logic to fcmps

Summary

This builds on the work from https://reviews.llvm.org/D44287. It turned out supporting fcmp was much easier than I realized, so let's do that now.

As an aside, our -O3 handling of a floating point IV leaves a lot to be desired. We do convert the float IV to an integer IV, but do so late enough that many other optimizations are missed (e.g. we don't vectorize).

Diff Detail

Repository: rL LLVM

Event Timeline

reames created this revision. · Mar 15 2018, 2:22 PM

Herald added subscribers: bollu, mcrosier. · View Herald Transcript · Mar 15 2018, 2:22 PM

reames edited the summary of this revision. (Show Details) · Mar 15 2018, 2:23 PM

lgtm!

This revision is now accepted and ready to land. · Mar 16 2018, 6:12 AM

Closed by commit rL327722: [LICM/mustexec] Extend first iteration must execute logic to fcmps (authored by reames). · Explain Why · Mar 16 2018, 9:36 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

llvm/

trunk/

lib/

Transforms/

Utils/

LoopUtils.cpp

19 lines

test/

Transforms/

LICM/

hoist-mustexec.ll

28 lines

Diff 138727

llvm/trunk/lib/Transforms/Utils/LoopUtils.cpp

Show First 20 Lines • Show All 1,524 Lines • ▼ Show 20 Lines	static bool CanProveNotTakenFirstIteration(BasicBlock *ExitBlock,
auto *CondExitBlock = ExitBlock->getSinglePredecessor();		auto *CondExitBlock = ExitBlock->getSinglePredecessor();
if (!CondExitBlock)		if (!CondExitBlock)
// expect unique exits		// expect unique exits
return false;		return false;
assert(CurLoop->contains(CondExitBlock) && "meaning of exit block");		assert(CurLoop->contains(CondExitBlock) && "meaning of exit block");
auto *BI = dyn_cast<BranchInst>(CondExitBlock->getTerminator());		auto *BI = dyn_cast<BranchInst>(CondExitBlock->getTerminator());
if (!BI \|\| !BI->isConditional())		if (!BI \|\| !BI->isConditional())
return false;		return false;
// todo: handle fcmp someday		auto *Cond = dyn_cast<CmpInst>(BI->getCondition());
		if (!Cond)
		return false;
// todo: this would be a lot more powerful if we used scev, but all the		// todo: this would be a lot more powerful if we used scev, but all the
// plumbing is currently missing to pass a pointer in from the pass		// plumbing is currently missing to pass a pointer in from the pass
auto *ICI = dyn_cast<ICmpInst>(BI->getCondition());
if (!ICI)
return false;
// Check for cmp (phi [x, preheader] ...), y where (pred x, y is known		// Check for cmp (phi [x, preheader] ...), y where (pred x, y is known
auto *LHS = dyn_cast<PHINode>(ICI->getOperand(0));		auto *LHS = dyn_cast<PHINode>(Cond->getOperand(0));
auto *RHS = ICI->getOperand(1);		auto *RHS = Cond->getOperand(1);
if (!LHS \|\| LHS->getParent() != CurLoop->getHeader())		if (!LHS \|\| LHS->getParent() != CurLoop->getHeader())
return false;		return false;
auto DL = ExitBlock->getModule()->getDataLayout();		auto DL = ExitBlock->getModule()->getDataLayout();
auto *IVStart = LHS->getIncomingValueForBlock(CurLoop->getLoopPreheader());		auto *IVStart = LHS->getIncomingValueForBlock(CurLoop->getLoopPreheader());
auto *SimpleValOrNull = SimplifyICmpInst(ICI->getPredicate(),		auto *SimpleValOrNull = SimplifyCmpInst(Cond->getPredicate(),
IVStart, RHS,		IVStart, RHS,
{DL, /TLI/ nullptr,		{DL, /TLI/ nullptr,
DT, /AC/ nullptr, BI});		DT, /AC/ nullptr, BI});
auto *SimpleCst = dyn_cast_or_null<Constant>(SimpleValOrNull);		auto *SimpleCst = dyn_cast_or_null<Constant>(SimpleValOrNull);
if (!SimpleCst)		if (!SimpleCst)
return false;		return false;
if (ExitBlock == BI->getSuccessor(0))		if (ExitBlock == BI->getSuccessor(0))
return SimpleCst->isZeroValue();		return SimpleCst->isZeroValue();
assert(ExitBlock == BI->getSuccessor(1) && "implied by above");		assert(ExitBlock == BI->getSuccessor(1) && "implied by above");
return SimpleCst->isAllOnesValue();		return SimpleCst->isAllOnesValue();
}		}
▲ Show 20 Lines • Show All 282 Lines • Show Last 20 Lines

llvm/trunk/test/Transforms/LICM/hoist-mustexec.ll

	Show All 27 Lines
	for.cond.cleanup:			for.cond.cleanup:
	ret i32 %add			ret i32 %add

	fail:			fail:
	call void @f()			call void @f()
	ret i32 -1			ret i32 -1
	}			}

				; Same as test1, but with a floating point IV (induction variable) and fcmp.
				; The range check in %for.body is an `fcmp olt` of the IV against the
				; constant 2000.0, and the IV's incoming value from %entry is the constant
				; 0.0, so the check holds on the first iteration and the exit to %fail is
				; not taken then.
				define i32 @test_fcmp(i32* noalias nocapture readonly %a) nounwind uwtable {
				; CHECK-LABEL: @test_fcmp(
				entry:
				; The two directives below expect the load of %a to appear immediately
				; before the unconditional branch to %for.body (presumably because LICM
				; hoisted it out of the loop -- the RUN line is not visible here).
				; CHECK: %i1 = load i32, i32* %a, align 4
				; CHECK-NEXT: br label %for.body
				br label %for.body

				for.body:
				; Float IV: 0.0 when entered from %entry, %inc on the backedge from %continue.
				%iv = phi float [ 0.0, %entry ], [ %inc, %continue ]
				; Running sum of the loaded value.
				%acc = phi i32 [ 0, %entry ], [ %add, %continue ]
				; Range check on the IV; a false result leaves the loop through %fail.
				%r.chk = fcmp olt float %iv, 2000.0
				br i1 %r.chk, label %continue, label %fail
				continue:
				; In the input this load sits behind the range check above; it is the
				; instruction the directives in %entry look for.
				%i1 = load i32, i32* %a, align 4
				%add = add nsw i32 %i1, %acc
				%inc = fadd float %iv, 1.0
				; Leave the loop once the incremented IV is greater than 1000.0.
				%exitcond = fcmp ogt float %inc, 1000.0
				br i1 %exitcond, label %for.cond.cleanup, label %for.body

				for.cond.cleanup:
				ret i32 %add

				fail:
				; Range-check failure path: call @f and return -1.
				call void @f()
				ret i32 -1
				}

	; Count down from a.length w/entry guard			; Count down from a.length w/entry guard
	; TODO: currently unable to prove the following:			; TODO: currently unable to prove the following:
	; ule i32 (add nsw i32 %len, -1), %len where len is [0, 512]			; ule i32 (add nsw i32 %len, -1), %len where len is [0, 512]
	define i32 @test2(i32* noalias nocapture readonly %a) nounwind uwtable {			define i32 @test2(i32* noalias nocapture readonly %a) nounwind uwtable {
	; CHECK-LABEL: @test2(			; CHECK-LABEL: @test2(
	entry:			entry:
	%len = load i32, i32* %a, align 4, !range !{i32 0, i32 512}			%len = load i32, i32* %a, align 4, !range !{i32 0, i32 512}
	%is.non.pos = icmp eq i32 %len, 0			%is.non.pos = icmp eq i32 %len, 0
	▲ Show 20 Lines • Show All 206 Lines • Show Last 20 Lines