Diff 229873

llvm/include/llvm/Analysis/BranchProbabilityInfo.h

Show All 28 Lines
#include <cstdint>		#include <cstdint>
#include <utility>		#include <utility>

namespace llvm {		namespace llvm {

class Function;		class Function;
class LoopInfo;		class LoopInfo;
class raw_ostream;		class raw_ostream;
		class PostDominatorTree;
class TargetLibraryInfo;		class TargetLibraryInfo;
class Value;		class Value;

/// Analysis providing branch probability information.		/// Analysis providing branch probability information.
///		///
/// This is a function analysis which provides information on the relative		/// This is a function analysis which provides information on the relative
/// probabilities of each "edge" in the function's CFG where such an edge is		/// probabilities of each "edge" in the function's CFG where such an edge is
/// defined by a pair (PredBlock and an index in the successors). The		/// defined by a pair (PredBlock and an index in the successors). The
▲ Show 20 Lines • Show All 137 Lines • ▼ Show 20 Lines	private:
const Function *LastF = nullptr;		const Function *LastF = nullptr;

/// Track the set of blocks directly succeeded by a returning block.		/// Track the set of blocks directly succeeded by a returning block.
SmallPtrSet<const BasicBlock *, 16> PostDominatedByUnreachable;		SmallPtrSet<const BasicBlock *, 16> PostDominatedByUnreachable;

/// Track the set of blocks that always lead to a cold call.		/// Track the set of blocks that always lead to a cold call.
SmallPtrSet<const BasicBlock *, 16> PostDominatedByColdCall;		SmallPtrSet<const BasicBlock *, 16> PostDominatedByColdCall;

void updatePostDominatedByUnreachable(const BasicBlock *BB);		void computePostDominatedByUnreachable(const Function &F,
void updatePostDominatedByColdCall(const BasicBlock *BB);		PostDominatorTree *PDT);
		void computePostDominatedByColdCall(const Function &F,
		PostDominatorTree *PDT);
bool calcUnreachableHeuristics(const BasicBlock *BB);		bool calcUnreachableHeuristics(const BasicBlock *BB);
bool calcMetadataWeights(const BasicBlock *BB);		bool calcMetadataWeights(const BasicBlock *BB);
bool calcColdCallHeuristics(const BasicBlock *BB);		bool calcColdCallHeuristics(const BasicBlock *BB);
bool calcPointerHeuristics(const BasicBlock *BB);		bool calcPointerHeuristics(const BasicBlock *BB);
bool calcLoopBranchHeuristics(const BasicBlock *BB, const LoopInfo &LI,		bool calcLoopBranchHeuristics(const BasicBlock *BB, const LoopInfo &LI,
SccInfo &SccI);		SccInfo &SccI);
bool calcZeroHeuristics(const BasicBlock BB, const TargetLibraryInfo TLI);		bool calcZeroHeuristics(const BasicBlock BB, const TargetLibraryInfo TLI);
bool calcFloatingPointHeuristics(const BasicBlock *BB);		bool calcFloatingPointHeuristics(const BasicBlock *BB);
▲ Show 20 Lines • Show All 50 Lines • Show Last 20 Lines

llvm/lib/Analysis/BranchProbabilityInfo.cpp

Show All 10 Lines
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "llvm/Analysis/BranchProbabilityInfo.h"		#include "llvm/Analysis/BranchProbabilityInfo.h"
#include "llvm/ADT/PostOrderIterator.h"		#include "llvm/ADT/PostOrderIterator.h"
#include "llvm/ADT/SCCIterator.h"		#include "llvm/ADT/SCCIterator.h"
#include "llvm/ADT/STLExtras.h"		#include "llvm/ADT/STLExtras.h"
#include "llvm/ADT/SmallVector.h"		#include "llvm/ADT/SmallVector.h"
#include "llvm/Analysis/LoopInfo.h"		#include "llvm/Analysis/LoopInfo.h"
		#include "llvm/Analysis/PostDominators.h"
#include "llvm/Analysis/TargetLibraryInfo.h"		#include "llvm/Analysis/TargetLibraryInfo.h"
#include "llvm/IR/Attributes.h"		#include "llvm/IR/Attributes.h"
#include "llvm/IR/BasicBlock.h"		#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/CFG.h"		#include "llvm/IR/CFG.h"
#include "llvm/IR/Constants.h"		#include "llvm/IR/Constants.h"
#include "llvm/IR/Dominators.h"		#include "llvm/IR/Dominators.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
#include "llvm/IR/InstrTypes.h"		#include "llvm/IR/InstrTypes.h"
▲ Show 20 Lines • Show All 114 Lines • ▼ Show 20 Lines
static const uint32_t IH_TAKEN_WEIGHT = 1024 * 1024 - 1;		static const uint32_t IH_TAKEN_WEIGHT = 1024 * 1024 - 1;

/// Invoke-terminating normal branch not-taken weight.		/// Invoke-terminating normal branch not-taken weight.
///		///
/// This is the weight for branching to the unwind destination of an invoke		/// This is the weight for branching to the unwind destination of an invoke
/// instruction. This is essentially never taken.		/// instruction. This is essentially never taken.
static const uint32_t IH_NONTAKEN_WEIGHT = 1;		static const uint32_t IH_NONTAKEN_WEIGHT = 1;

/// Add \p BB to PostDominatedByUnreachable set if applicable.		static void UpdatePDTWorklist(const BasicBlock BB, PostDominatorTree PDT,
void		SmallVectorImpl<const BasicBlock *> &WorkList,
BranchProbabilityInfo::updatePostDominatedByUnreachable(const BasicBlock *BB) {		SmallPtrSetImpl<const BasicBlock *> &TargetSet) {
const Instruction *TI = BB->getTerminator();		SmallVector<BasicBlock *, 8> Descendants;
		SmallPtrSet<const BasicBlock *, 16> NewItems;

		PDT->getDescendants(const_cast<BasicBlock *>(BB), Descendants);
		for (auto *BB : Descendants)
		if (TargetSet.insert(BB).second)
		NewItems.insert(pred_begin(BB), pred_end(BB));
		skatkovUnsubmitted Not Done Reply Inline Actions Theoretically, a predecessor might already be marked in TargetSet, so you could filter such blocks out of the list of predecessors being added. skatkov: Theoretically, a predecessor might already be marked in TargetSet, so you could filter…
		WorkList.insert(WorkList.end(), NewItems.begin(), NewItems.end());
		}

		/// Compute a set of basic blocks that are post-dominated by unreachables.
		void BranchProbabilityInfo::computePostDominatedByUnreachable(
		const Function &F, PostDominatorTree *PDT) {
		SmallVector<const BasicBlock *, 8> WorkList;
		for (auto &BB : F) {
		const Instruction *TI = BB.getTerminator();
if (TI->getNumSuccessors() == 0) {		if (TI->getNumSuccessors() == 0) {
if (isa<UnreachableInst>(TI) \|\|		if (isa<UnreachableInst>(TI) \|\|
// If this block is terminated by a call to		// If this block is terminated by a call to
// @llvm.experimental.deoptimize then treat it like an unreachable since		// @llvm.experimental.deoptimize then treat it like an unreachable
// the @llvm.experimental.deoptimize call is expected to practically		// since the @llvm.experimental.deoptimize call is expected to
// never execute.		// practically never execute.
BB->getTerminatingDeoptimizeCall())		BB.getTerminatingDeoptimizeCall())
PostDominatedByUnreachable.insert(BB);		UpdatePDTWorklist(&BB, PDT, WorkList, PostDominatedByUnreachable);
return;		}
}		}

// If the terminator is an InvokeInst, check only the normal destination block		while (!WorkList.empty()) {
// as the unwind edge of InvokeInst is also very unlikely taken.		const BasicBlock *BB = WorkList.pop_back_val();
if (auto *II = dyn_cast<InvokeInst>(TI)) {		if (PostDominatedByUnreachable.count(BB))
		continue;
		// If the terminator is an InvokeInst, check only the normal destination
		// block as the unwind edge of InvokeInst is also very unlikely taken.
		if (auto *II = dyn_cast<InvokeInst>(BB->getTerminator())) {
if (PostDominatedByUnreachable.count(II->getNormalDest()))		if (PostDominatedByUnreachable.count(II->getNormalDest()))
PostDominatedByUnreachable.insert(BB);		UpdatePDTWorklist(BB, PDT, WorkList, PostDominatedByUnreachable);
return;		}
		// If all the successors are unreachable, BB is unreachable as well.
		else if (!successors(BB).empty() &&
		llvm::all_of(successors(BB), [this](const BasicBlock *Succ) {
		return PostDominatedByUnreachable.count(Succ);
		}))
		UpdatePDTWorklist(BB, PDT, WorkList, PostDominatedByUnreachable);
}		}

for (auto *I : successors(BB))
// If any of successor is not post dominated then BB is also not.
if (!PostDominatedByUnreachable.count(I))
return;

PostDominatedByUnreachable.insert(BB);
}		}

/// Add \p BB to PostDominatedByColdCall set if applicable.		/// compute a set of basic blocks that are post-dominated by ColdCalls.
void		void BranchProbabilityInfo::computePostDominatedByColdCall(
BranchProbabilityInfo::updatePostDominatedByColdCall(const BasicBlock *BB) {		const Function &F, PostDominatorTree *PDT) {
assert(!PostDominatedByColdCall.count(BB));		SmallVector<const BasicBlock *, 8> WorkList;
const Instruction *TI = BB->getTerminator();		for (auto &BB : F)
if (TI->getNumSuccessors() == 0)		for (auto &I : BB)
return;		if (const CallInst *CI = dyn_cast<CallInst>(&I))
		if (CI->hasFnAttr(Attribute::Cold))
		UpdatePDTWorklist(&BB, PDT, WorkList, PostDominatedByColdCall);

// If all of successor are post dominated then BB is also done.		while (!WorkList.empty()) {
if (llvm::all_of(successors(BB), [&](const BasicBlock *SuccBB) {		const BasicBlock *BB = WorkList.pop_back_val();
return PostDominatedByColdCall.count(SuccBB);
})) {
PostDominatedByColdCall.insert(BB);
return;
}

// If the terminator is an InvokeInst, check only the normal destination		// If the terminator is an InvokeInst, check only the normal destination
// block as the unwind edge of InvokeInst is also very unlikely taken.		// block as the unwind edge of InvokeInst is also very unlikely taken.
if (auto *II = dyn_cast<InvokeInst>(TI))		if (auto *II = dyn_cast<InvokeInst>(BB->getTerminator())) {
if (PostDominatedByColdCall.count(II->getNormalDest())) {		if (PostDominatedByColdCall.count(II->getNormalDest()))
PostDominatedByColdCall.insert(BB);		UpdatePDTWorklist(BB, PDT, WorkList, PostDominatedByColdCall);
return;
}		}
		// If all of successor are post dominated then BB is also done.
// Otherwise, if the block itself contains a cold function, add it to the		else if (!successors(BB).empty() &&
// set of blocks post-dominated by a cold call.		llvm::all_of(successors(BB), [this](const BasicBlock *Succ) {
for (auto &I : *BB)		return PostDominatedByColdCall.count(Succ);
if (const CallInst *CI = dyn_cast<CallInst>(&I))		}))
if (CI->hasFnAttr(Attribute::Cold)) {		UpdatePDTWorklist(BB, PDT, WorkList, PostDominatedByColdCall);
PostDominatedByColdCall.insert(BB);
return;
}		}
}		}

/// Calculate edge weights for successors lead to unreachable.		/// Calculate edge weights for successors lead to unreachable.
///		///
/// Predict that a successor which leads necessarily to an		/// Predict that a successor which leads necessarily to an
/// unreachable-terminated block as extremely unlikely.		/// unreachable-terminated block as extremely unlikely.
bool BranchProbabilityInfo::calcUnreachableHeuristics(const BasicBlock *BB) {		bool BranchProbabilityInfo::calcUnreachableHeuristics(const BasicBlock *BB) {
const Instruction *TI = BB->getTerminator();		const Instruction *TI = BB->getTerminator();
▲ Show 20 Lines • Show All 758 Lines • ▼ Show 20 Lines	for (scc_iterator<const Function *> It = scc_begin(&F); !It.isAtEnd();
LLVM_DEBUG(dbgs() << "BPI: SCC " << SccNum << ":");		LLVM_DEBUG(dbgs() << "BPI: SCC " << SccNum << ":");
for (auto *BB : Scc) {		for (auto *BB : Scc) {
LLVM_DEBUG(dbgs() << " " << BB->getName());		LLVM_DEBUG(dbgs() << " " << BB->getName());
SccI.SccNums[BB] = SccNum;		SccI.SccNums[BB] = SccNum;
}		}
LLVM_DEBUG(dbgs() << "\n");		LLVM_DEBUG(dbgs() << "\n");
}		}

		std::unique_ptr<PostDominatorTree> PDT =
		std::make_unique<PostDominatorTree>(const_cast<Function &>(F));
		computePostDominatedByUnreachable(F, PDT.get());
		computePostDominatedByColdCall(F, PDT.get());

// Walk the basic blocks in post-order so that we can build up state about		// Walk the basic blocks in post-order so that we can build up state about
// the successors of a block iteratively.		// the successors of a block iteratively.
for (auto BB : post_order(&F.getEntryBlock())) {		for (auto BB : post_order(&F.getEntryBlock())) {
LLVM_DEBUG(dbgs() << "Computing probabilities for " << BB->getName()		LLVM_DEBUG(dbgs() << "Computing probabilities for " << BB->getName()
<< "\n");		<< "\n");
updatePostDominatedByUnreachable(BB);
updatePostDominatedByColdCall(BB);
// If there is no at least two successors, no sense to set probability.		// If there is no at least two successors, no sense to set probability.
if (BB->getTerminator()->getNumSuccessors() < 2)		if (BB->getTerminator()->getNumSuccessors() < 2)
continue;		continue;
if (calcMetadataWeights(BB))		if (calcMetadataWeights(BB))
continue;		continue;
if (calcInvokeHeuristics(BB))		if (calcInvokeHeuristics(BB))
continue;		continue;
if (calcUnreachableHeuristics(BB))		if (calcUnreachableHeuristics(BB))
▲ Show 20 Lines • Show All 65 Lines • Show Last 20 Lines

llvm/test/Analysis/BranchProbabilityInfo/basic.ll

Show First 20 Lines • Show All 135 Lines • ▼ Show 20 Lines	else:
br label %exit		br label %exit
; CHECK: edge else -> exit probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]		; CHECK: edge else -> exit probability is 0x80000000 / 0x80000000 = 100.00% [HOT edge]

exit:		exit:
%result = phi i32 [ %a, %then ], [ %b, %else ]		%result = phi i32 [ %a, %then ], [ %b, %else ]
ret i32 %result		ret i32 %result
}		}

		define i32 @test_cold_loop(i32 %a, i32 %b) {
		entry:
		%cond1 = icmp eq i32 %a, 42
		br i1 %cond1, label %header, label %exit

		header:
		br label %body

		body:
		%cond2 = icmp eq i32 %b, 42
		br i1 %cond2, label %header, label %exit
		; CHECK: edge body -> header probability is 0x40000000 / 0x80000000 = 50.00%

		exit:
		call void @coldfunc()
		ret i32 %b
		}

declare i32 @regular_function(i32 %i)		declare i32 @regular_function(i32 %i)

define i32 @test_cold_call_sites_with_prof(i32 %a, i32 %b, i1 %flag, i1 %flag2) {		define i32 @test_cold_call_sites_with_prof(i32 %a, i32 %b, i1 %flag, i1 %flag2) {
; CHECK: Printing analysis {{.*}} for function 'test_cold_call_sites_with_prof'		; CHECK: Printing analysis {{.*}} for function 'test_cold_call_sites_with_prof'
entry:		entry:
br i1 %flag, label %then, label %else		br i1 %flag, label %then, label %else
; CHECK: edge entry -> then probability is 0x07878788 / 0x80000000 = 5.88%		; CHECK: edge entry -> then probability is 0x07878788 / 0x80000000 = 5.88%
; CHECK: edge entry -> else probability is 0x78787878 / 0x80000000 = 94.12% [HOT edge]		; CHECK: edge entry -> else probability is 0x78787878 / 0x80000000 = 94.12% [HOT edge]
▲ Show 20 Lines • Show All 448 Lines • Show Last 20 Lines

llvm/test/Analysis/BranchProbabilityInfo/noreturn.ll

	Show First 20 Lines • Show All 73 Lines • ▼ Show 20 Lines
	abort:			abort:
	call void @abort() noreturn			call void @abort() noreturn
	unreachable			unreachable

	exit:			exit:
	ret i32 %b			ret i32 %b
	}			}

				define i32 @test4(i32 %a, i32 %b) {
				; CHECK: Printing analysis {{.*}} for function 'test4'
				; Make sure we handle loops post-dominated by unreachables.
				entry:
				%cond1 = icmp eq i32 %a, 42
				br i1 %cond1, label %header, label %exit
				; CHECK: edge entry -> header probability is 0x00000001 / 0x80000000 = 0.00%
				; CHECK: edge entry -> exit probability is 0x7fffffff / 0x80000000 = 100.00% [HOT edge]

				header:
				br label %body

				body:
				%cond2 = icmp eq i32 %a, 42
				br i1 %cond2, label %header, label %abort
				; CHECK: edge body -> header probability is 0x40000000 / 0x80000000 = 50.00%
				; CHECK: edge body -> abort probability is 0x40000000 / 0x80000000 = 50.00%

				abort:
				call void @abort() noreturn
				unreachable

				exit:
				ret i32 %b
				}

	@_ZTIi = external global i8*			@_ZTIi = external global i8*

	; CHECK-LABEL: throwSmallException			; CHECK-LABEL: throwSmallException
	; CHECK-NOT: invoke i32 @smallFunction			; CHECK-NOT: invoke i32 @smallFunction
	define i32 @throwSmallException(i32 %idx, i32 %limit) #0 personality i8* bitcast (i32 (...)* @__gxx_personality_v0 to i8*) {			define i32 @throwSmallException(i32 %idx, i32 %limit) #0 personality i8* bitcast (i32 (...)* @__gxx_personality_v0 to i8*) {
	entry:			entry:
	%cmp = icmp sge i32 %idx, %limit			%cmp = icmp sge i32 %idx, %limit
	br i1 %cmp, label %if.then, label %if.end			br i1 %cmp, label %if.then, label %if.end
	Show All 36 Lines

llvm/test/CodeGen/X86/block-placement.ll

	Show First 20 Lines • Show All 352 Lines • ▼ Show 20 Lines
	; Test that we can handle a loop with a nested natural loop and an unnatural			; Test that we can handle a loop with a nested natural loop and an unnatural
	; loop. This was reduced from a crash on block placement when run over			; loop. This was reduced from a crash on block placement when run over
	; single-source GCC.			; single-source GCC.
	; CHECK-LABEL: unnatural_cfg2			; CHECK-LABEL: unnatural_cfg2
	; CHECK: %entry			; CHECK: %entry
	; CHECK: %loop.header			; CHECK: %loop.header
	; CHECK: %loop.body1			; CHECK: %loop.body1
	; CHECK: %loop.body2			; CHECK: %loop.body2
				; CHECK: %loop.body3
				; CHECK: %loop.inner1.begin
	; CHECK: %loop.body4			; CHECK: %loop.body4
	; CHECK: %loop.inner2.begin			; CHECK: %loop.inner2.begin
	; CHECK: %loop.inner2.begin			; CHECK: %loop.inner2.begin
	; CHECK: %loop.body3
	; CHECK: %loop.inner1.begin
	; CHECK: %bail			; CHECK: %bail

	entry:			entry:
	br label %loop.header			br label %loop.header

	loop.header:			loop.header:
	%comp0 = icmp eq i32* %p0, null			%comp0 = icmp eq i32* %p0, null
	br i1 %comp0, label %bail, label %loop.body1			br i1 %comp0, label %bail, label %loop.body1
	▲ Show 20 Lines • Show All 1,229 Lines • Show Last 20 Lines

llvm/test/CodeGen/X86/pr37916.ll

	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc -mtriple=i386-unknown-linux-gnu %s -o - \| FileCheck %s			; RUN: llc -mtriple=i386-unknown-linux-gnu %s -o - \| FileCheck %s

	@f = external local_unnamed_addr global i64*, align 4			@f = external local_unnamed_addr global i64*, align 4
	@a = external global i64, align 8			@a = external global i64, align 8

	define void @fn1() local_unnamed_addr {			define void @fn1() local_unnamed_addr {
	; CHECK-LABEL: fn1:			; CHECK-LABEL: fn1:
	; CHECK: # %bb.0: # %entry			; CHECK: # %bb.0: # %entry
	; CHECK-NEXT: .p2align 4, 0x90
	skatkovUnsubmitted Not Done Reply Inline Actions Why did we lose this alignment? skatkov: Why did we lose this alignment?
	; CHECK-NEXT: .LBB0_1: # %if.end			; CHECK-NEXT: .LBB0_1: # %if.end
	; CHECK-NEXT: # =>This Inner Loop Header: Depth=1			; CHECK-NEXT: # =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: movl a+4, %eax			; CHECK-NEXT: movl a+4, %eax
	; CHECK-NEXT: orl a, %eax			; CHECK-NEXT: orl a, %eax
	; CHECK-NEXT: movl $a, f			; CHECK-NEXT: movl $a, f
	; CHECK-NEXT: je .LBB0_3			; CHECK-NEXT: je .LBB0_3
	; CHECK-NEXT: # %bb.2: # %if.end			; CHECK-NEXT: # %bb.2: # %if.end
	; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1			; CHECK-NEXT: # in Loop: Header=BB0_1 Depth=1
	Show All 26 Lines

llvm/test/CodeGen/X86/ragreedy-hoist-spill.ll

	; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
	; RUN: llc < %s -mtriple=x86_64-apple-macosx -regalloc=greedy \| FileCheck %s			; RUN: llc < %s -mtriple=x86_64-apple-macosx -regalloc=greedy \| FileCheck %s

	; This testing case is reduced from 254.gap SyFgets function.			; This testing case is reduced from 254.gap SyFgets function.
	; We make sure a spill is hoisted to a cold BB inside the hotter outer loop.			; We make sure a spill is hoisted to a cold BB inside the hotter outer loop.
				skatkovUnsubmitted Not Done Reply Inline Actions I am having trouble determining whether the test still exercises the expected behavior. Did you verify that it does, or did you just regenerate the expected output? skatkov: I am having trouble determining whether the test still exercises the expected behavior. Did…

	%struct.TMP.1 = type { %struct.TMP.2, %struct.TMP.2, [1024 x i8] }			%struct.TMP.1 = type { %struct.TMP.2, %struct.TMP.2, [1024 x i8] }
	%struct.TMP.2 = type { i8, i32, i32, i16, i16, %struct.TMP.3, i32, i8, i32 (i8), i32 (i8, i8, i32), i64 (i8, i64, i32), i32 (i8, i8, i32), %struct.TMP.3, %struct.TMP.4*, i32, [3 x i8], [1 x i8], %struct.TMP.3, i32, i64 }			%struct.TMP.2 = type { i8, i32, i32, i16, i16, %struct.TMP.3, i32, i8, i32 (i8), i32 (i8, i8, i32), i64 (i8, i64, i32), i32 (i8, i8, i32), %struct.TMP.3, %struct.TMP.4*, i32, [3 x i8], [1 x i8], %struct.TMP.3, i32, i64 }
	%struct.TMP.4 = type opaque			%struct.TMP.4 = type opaque
	%struct.TMP.3 = type { i8*, i32 }			%struct.TMP.3 = type { i8*, i32 }

	@syBuf = external global [16 x %struct.TMP.1], align 16			@syBuf = external global [16 x %struct.TMP.1], align 16
	@syHistory = external global [8192 x i8], align 16			@syHistory = external global [8192 x i8], align 16
	Show All 10 Lines
	; CHECK-NEXT: pushq %r14			; CHECK-NEXT: pushq %r14
	; CHECK-NEXT: .cfi_def_cfa_offset 32			; CHECK-NEXT: .cfi_def_cfa_offset 32
	; CHECK-NEXT: pushq %r13			; CHECK-NEXT: pushq %r13
	; CHECK-NEXT: .cfi_def_cfa_offset 40			; CHECK-NEXT: .cfi_def_cfa_offset 40
	; CHECK-NEXT: pushq %r12			; CHECK-NEXT: pushq %r12
	; CHECK-NEXT: .cfi_def_cfa_offset 48			; CHECK-NEXT: .cfi_def_cfa_offset 48
	; CHECK-NEXT: pushq %rbx			; CHECK-NEXT: pushq %rbx
	; CHECK-NEXT: .cfi_def_cfa_offset 56			; CHECK-NEXT: .cfi_def_cfa_offset 56
	; CHECK-NEXT: subq $536, %rsp ## imm = 0x218			; CHECK-NEXT: subq $552, %rsp ## imm = 0x228
	; CHECK-NEXT: .cfi_def_cfa_offset 592			; CHECK-NEXT: .cfi_def_cfa_offset 608
	; CHECK-NEXT: .cfi_offset %rbx, -56			; CHECK-NEXT: .cfi_offset %rbx, -56
	; CHECK-NEXT: .cfi_offset %r12, -48			; CHECK-NEXT: .cfi_offset %r12, -48
	; CHECK-NEXT: .cfi_offset %r13, -40			; CHECK-NEXT: .cfi_offset %r13, -40
	; CHECK-NEXT: .cfi_offset %r14, -32			; CHECK-NEXT: .cfi_offset %r14, -32
	; CHECK-NEXT: .cfi_offset %r15, -24			; CHECK-NEXT: .cfi_offset %r15, -24
	; CHECK-NEXT: .cfi_offset %rbp, -16			; CHECK-NEXT: .cfi_offset %rbp, -16
	; CHECK-NEXT: movq %rdx, %rax			; CHECK-NEXT: movq %rdx, %rax
	; CHECK-NEXT: orq $2, %rax			; CHECK-NEXT: orq $2, %rax
	; CHECK-NEXT: cmpq $2, %rax			; CHECK-NEXT: cmpq $2, %rax
	; CHECK-NEXT: jne LBB0_4			; CHECK-NEXT: jne LBB0_4
	; CHECK-NEXT: ## %bb.1: ## %if.end			; CHECK-NEXT: ## %bb.1: ## %if.end
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: jne LBB0_5			; CHECK-NEXT: jne LBB0_5
	; CHECK-NEXT: ## %bb.2: ## %if.then4			; CHECK-NEXT: ## %bb.2: ## %if.then4
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: je LBB0_55			; CHECK-NEXT: je LBB0_55
	; CHECK-NEXT: ## %bb.3: ## %SyTime.exit			; CHECK-NEXT: ## %bb.3: ## %SyTime.exit
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: je LBB0_55			; CHECK-NEXT: je LBB0_55
	; CHECK-NEXT: LBB0_4: ## %cleanup			; CHECK-NEXT: LBB0_4: ## %cleanup
	; CHECK-NEXT: addq $536, %rsp ## imm = 0x218			; CHECK-NEXT: addq $552, %rsp ## imm = 0x228
	; CHECK-NEXT: popq %rbx			; CHECK-NEXT: popq %rbx
	; CHECK-NEXT: popq %r12			; CHECK-NEXT: popq %r12
	; CHECK-NEXT: popq %r13			; CHECK-NEXT: popq %r13
	; CHECK-NEXT: popq %r14			; CHECK-NEXT: popq %r14
	; CHECK-NEXT: popq %r15			; CHECK-NEXT: popq %r15
	; CHECK-NEXT: popq %rbp			; CHECK-NEXT: popq %rbp
	; CHECK-NEXT: retq			; CHECK-NEXT: retq
	; CHECK-NEXT: LBB0_5: ## %if.end25			; CHECK-NEXT: LBB0_5: ## %if.end25
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: je LBB0_55			; CHECK-NEXT: je LBB0_55
	; CHECK-NEXT: ## %bb.6: ## %SyTime.exit2720			; CHECK-NEXT: ## %bb.6: ## %SyTime.exit2720
	; CHECK-NEXT: movq %rdx, %rbx			; CHECK-NEXT: movq %rdx, %rbx
	; CHECK-NEXT: movq %rdi, %rbp			; CHECK-NEXT: movq %rdi, %r14
	; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rax			; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rax
	; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rcx			; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rcx
	; CHECK-NEXT: cmpq %rax, %rcx			; CHECK-NEXT: cmpq %rax, %rcx
	; CHECK-NEXT: jae LBB0_8			; CHECK-NEXT: jae LBB0_8
	; CHECK-NEXT: ## %bb.7: ## %for.body.lr.ph			; CHECK-NEXT: ## %bb.7: ## %for.body.lr.ph
	; CHECK-NEXT: movl $512, %edx ## imm = 0x200			; CHECK-NEXT: movl $512, %edx ## imm = 0x200
	; CHECK-NEXT: movl $32, %esi			; CHECK-NEXT: movl $32, %esi
	; CHECK-NEXT: callq _memset			; CHECK-NEXT: callq _memset
	; CHECK-NEXT: LBB0_8: ## %while.body.preheader			; CHECK-NEXT: LBB0_8: ## %while.body.preheader
	; CHECK-NEXT: movq %rbp, {{[-0-9]+}}(%r{{[sb]}}p) ## 8-byte Spill
	; CHECK-NEXT: imulq $1040, %rbx, %rax ## imm = 0x410			; CHECK-NEXT: imulq $1040, %rbx, %rax ## imm = 0x410
	; CHECK-NEXT: movq _syBuf@{{.*}}(%rip), %rcx			; CHECK-NEXT: movq _syBuf@{{.*}}(%rip), %rcx
	; CHECK-NEXT: leaq 8(%rcx,%rax), %rbx			; CHECK-NEXT: leaq 8(%rcx,%rax), %rax
				; CHECK-NEXT: movq %rax, {{[-0-9]+}}(%r{{[sb]}}p) ## 8-byte Spill
	; CHECK-NEXT: movl $1, %r15d			; CHECK-NEXT: movl $1, %r15d
	; CHECK-NEXT: movq _syCTRO@{{.*}}(%rip), %rax			; CHECK-NEXT: movq _syCTRO@{{.*}}(%rip), %rax
	; CHECK-NEXT: movb $1, %cl			; CHECK-NEXT: movb $1, %cl
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_9: ## %do.body			; CHECK-NEXT: LBB0_9: ## %do.body
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: movl $0, (%rax)			; CHECK-NEXT: movl $0, (%rax)
	; CHECK-NEXT: testb %cl, %cl			; CHECK-NEXT: testb %cl, %cl
	; CHECK-NEXT: jne LBB0_9			; CHECK-NEXT: jne LBB0_9
	; CHECK-NEXT: ## %bb.10: ## %do.end			; CHECK-NEXT: ## %bb.10: ## %do.end
	; CHECK-NEXT: xorl %r14d, %r14d			; CHECK-NEXT: xorl %ebp, %ebp
	; CHECK-NEXT: testb %r14b, %r14b			; CHECK-NEXT: testb %bpl, %bpl
	; CHECK-NEXT: jne LBB0_11			; CHECK-NEXT: jne LBB0_11
	; CHECK-NEXT: ## %bb.12: ## %while.body200.preheader			; CHECK-NEXT: ## %bb.12: ## %while.body200.preheader
	; CHECK-NEXT: xorl %edx, %edx			; CHECK-NEXT: xorl %ebx, %ebx
	; CHECK-NEXT: leaq {{.*}}(%rip), %rsi			; CHECK-NEXT: leaq {{.*}}(%rip), %r13
	; CHECK-NEXT: leaq {{.*}}(%rip), %rdi			; CHECK-NEXT: movl $0, {{[-0-9]+}}(%r{{[sb]}}p) ## 4-byte Folded Spill
	; CHECK-NEXT: xorl %ebp, %ebp			; CHECK-NEXT: xorl %r12d, %r12d
	; CHECK-NEXT: xorl %r13d, %r13d			; CHECK-NEXT: movq %r14, {{[-0-9]+}}(%r{{[sb]}}p) ## 8-byte Spill
	; CHECK-NEXT: jmp LBB0_13			; CHECK-NEXT: jmp LBB0_13
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_20: ## %sw.bb256			; CHECK-NEXT: LBB0_20: ## %sw.bb256
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movl %r14d, %r13d			; CHECK-NEXT: movl %ebp, %r12d
	; CHECK-NEXT: LBB0_21: ## %while.cond197.backedge			; CHECK-NEXT: LBB0_21: ## %while.cond197.backedge
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: decl %r15d			; CHECK-NEXT: decl %r15d
	; CHECK-NEXT: testl %r15d, %r15d			; CHECK-NEXT: testl %r15d, %r15d
	; CHECK-NEXT: movl %r13d, %r14d			; CHECK-NEXT: movl %r12d, %ebp
	; CHECK-NEXT: jle LBB0_22			; CHECK-NEXT: jle LBB0_22
	; CHECK-NEXT: LBB0_13: ## %while.body200			; CHECK-NEXT: LBB0_13: ## %while.body200
	; CHECK-NEXT: ## =>This Loop Header: Depth=1			; CHECK-NEXT: ## =>This Loop Header: Depth=1
	; CHECK-NEXT: ## Child Loop BB0_30 Depth 2			; CHECK-NEXT: ## Child Loop BB0_30 Depth 2
	; CHECK-NEXT: ## Child Loop BB0_38 Depth 2			; CHECK-NEXT: ## Child Loop BB0_38 Depth 2
	; CHECK-NEXT: leal -268(%r14), %eax			; CHECK-NEXT: leal -268(%rbp), %eax
	; CHECK-NEXT: cmpl $105, %eax			; CHECK-NEXT: cmpl $105, %eax
	; CHECK-NEXT: ja LBB0_14			; CHECK-NEXT: ja LBB0_14
	; CHECK-NEXT: ## %bb.56: ## %while.body200			; CHECK-NEXT: ## %bb.56: ## %while.body200
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movslq (%rdi,%rax,4), %rax			; CHECK-NEXT: movslq (%r13,%rax,4), %rax
	; CHECK-NEXT: addq %rdi, %rax			; CHECK-NEXT: addq %r13, %rax
	; CHECK-NEXT: jmpq *%rax			; CHECK-NEXT: jmpq *%rax
	; CHECK-NEXT: LBB0_44: ## %while.cond1037.preheader			; CHECK-NEXT: LBB0_44: ## %while.cond1037.preheader
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: movl %r14d, %r13d			; CHECK-NEXT: movl %ebp, %r12d
	; CHECK-NEXT: jne LBB0_21			; CHECK-NEXT: jne LBB0_21
	; CHECK-NEXT: jmp LBB0_55			; CHECK-NEXT: jmp LBB0_55
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_14: ## %while.body200			; CHECK-NEXT: LBB0_14: ## %while.body200
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: leal 1(%r14), %eax			; CHECK-NEXT: leal 1(%rbp), %eax
	; CHECK-NEXT: cmpl $21, %eax			; CHECK-NEXT: cmpl $21, %eax
	; CHECK-NEXT: ja LBB0_20			; CHECK-NEXT: ja LBB0_20
	; CHECK-NEXT: ## %bb.15: ## %while.body200			; CHECK-NEXT: ## %bb.15: ## %while.body200
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movl $-1, %r13d			; CHECK-NEXT: movl $-1, %r12d
	; CHECK-NEXT: movslq (%rsi,%rax,4), %rax			; CHECK-NEXT: leaq {{.*}}(%rip), %rcx
	; CHECK-NEXT: addq %rsi, %rax			; CHECK-NEXT: movslq (%rcx,%rax,4), %rax
				; CHECK-NEXT: addq %rcx, %rax
	; CHECK-NEXT: jmpq *%rax			; CHECK-NEXT: jmpq *%rax
	; CHECK-NEXT: LBB0_18: ## %while.cond201.preheader			; CHECK-NEXT: LBB0_18: ## %while.cond201.preheader
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movl $1, %r13d			; CHECK-NEXT: movl $1, %r12d
	; CHECK-NEXT: jmp LBB0_21			; CHECK-NEXT: jmp LBB0_21
	; CHECK-NEXT: LBB0_26: ## %sw.bb474			; CHECK-NEXT: LBB0_26: ## %sw.bb474
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: ## implicit-def: $r12			; CHECK-NEXT: ## implicit-def: $r14
	; CHECK-NEXT: jne LBB0_34			; CHECK-NEXT: jne LBB0_34
	; CHECK-NEXT: ## %bb.27: ## %do.body479.preheader			; CHECK-NEXT: ## %bb.27: ## %do.body479.preheader
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: ## implicit-def: $r12			; CHECK-NEXT: ## implicit-def: $r14
	; CHECK-NEXT: jne LBB0_34			; CHECK-NEXT: jne LBB0_34
	; CHECK-NEXT: ## %bb.28: ## %land.rhs485.preheader			; CHECK-NEXT: ## %bb.28: ## %land.rhs485.preheader
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: ## implicit-def: $rax			; CHECK-NEXT: ## implicit-def: $rax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: jns LBB0_30			; CHECK-NEXT: jns LBB0_30
	; CHECK-NEXT: jmp LBB0_55			; CHECK-NEXT: jmp LBB0_55
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_32: ## %do.body479.backedge			; CHECK-NEXT: LBB0_32: ## %do.body479.backedge
	; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2			; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2
	; CHECK-NEXT: leaq 1(%r12), %rax			; CHECK-NEXT: leaq 1(%r14), %rax
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: je LBB0_33			; CHECK-NEXT: je LBB0_33
	; CHECK-NEXT: ## %bb.29: ## %land.rhs485			; CHECK-NEXT: ## %bb.29: ## %land.rhs485
	; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2			; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: js LBB0_55			; CHECK-NEXT: js LBB0_55
	; CHECK-NEXT: LBB0_30: ## %cond.true.i.i2780			; CHECK-NEXT: LBB0_30: ## %cond.true.i.i2780
	; CHECK-NEXT: ## Parent Loop BB0_13 Depth=1			; CHECK-NEXT: ## Parent Loop BB0_13 Depth=1
	; CHECK-NEXT: ## => This Inner Loop Header: Depth=2			; CHECK-NEXT: ## => This Inner Loop Header: Depth=2
	; CHECK-NEXT: movq %rax, %r12			; CHECK-NEXT: movq %rax, %r14
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: jne LBB0_32			; CHECK-NEXT: jne LBB0_32
	; CHECK-NEXT: ## %bb.31: ## %lor.rhs500			; CHECK-NEXT: ## %bb.31: ## %lor.rhs500
	; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2			; CHECK-NEXT: ## in Loop: Header=BB0_30 Depth=2
	; CHECK-NEXT: movl $256, %esi ## imm = 0x100			; CHECK-NEXT: movl $256, %esi ## imm = 0x100
	; CHECK-NEXT: callq ___maskrune			; CHECK-NEXT: callq ___maskrune
	; CHECK-NEXT: xorl %edx, %edx			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: testb %dl, %dl
	; CHECK-NEXT: jne LBB0_32			; CHECK-NEXT: jne LBB0_32
	; CHECK-NEXT: jmp LBB0_34			; CHECK-NEXT: jmp LBB0_34
	; CHECK-NEXT: LBB0_45: ## %sw.bb1134			; CHECK-NEXT: LBB0_45: ## %sw.bb1134
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rax			; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rax
	; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rcx			; CHECK-NEXT: leaq {{[0-9]+}}(%rsp), %rcx
	; CHECK-NEXT: cmpq %rax, %rcx			; CHECK-NEXT: cmpq %rax, %rcx
	; CHECK-NEXT: jb LBB0_55			; CHECK-NEXT: jb LBB0_55
	; CHECK-NEXT: ## %bb.46: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## %bb.46: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: xorl %ebp, %ebp			; CHECK-NEXT: movl $0, {{[-0-9]+}}(%r{{[sb]}}p) ## 4-byte Folded Spill
	; CHECK-NEXT: movl $268, %r13d ## imm = 0x10C			; CHECK-NEXT: movl $268, %r12d ## imm = 0x10C
	; CHECK-NEXT: jmp LBB0_21			; CHECK-NEXT: jmp LBB0_21
	; CHECK-NEXT: LBB0_19: ## %sw.bb243			; CHECK-NEXT: LBB0_40: ## %sw.bb566
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movl $2, %r13d			; CHECK-NEXT: movl $20, %r12d
	; CHECK-NEXT: jmp LBB0_21			; CHECK-NEXT: jmp LBB0_21
	; CHECK-NEXT: LBB0_40: ## %sw.bb566			; CHECK-NEXT: LBB0_19: ## %sw.bb243
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movl $20, %r13d			; CHECK-NEXT: movl $2, %r12d
	; CHECK-NEXT: jmp LBB0_21			; CHECK-NEXT: jmp LBB0_21
	; CHECK-NEXT: LBB0_33: ## %if.end517.loopexitsplit			; CHECK-NEXT: LBB0_33: ## %if.end517.loopexitsplit
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: incq %r12			; CHECK-NEXT: incq %r14
	; CHECK-NEXT: LBB0_34: ## %if.end517			; CHECK-NEXT: LBB0_34: ## %if.end517
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: leal -324(%r13), %eax			; CHECK-NEXT: leal -324(%r12), %eax
	; CHECK-NEXT: cmpl $59, %eax			; CHECK-NEXT: cmpl $59, %eax
	; CHECK-NEXT: ja LBB0_35			; CHECK-NEXT: ja LBB0_35
	; CHECK-NEXT: ## %bb.57: ## %if.end517			; CHECK-NEXT: ## %bb.57: ## %if.end517
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movabsq $576460756598390785, %rcx ## imm = 0x800000100000001			; CHECK-NEXT: movabsq $576460756598390785, %rcx ## imm = 0x800000100000001
	; CHECK-NEXT: btq %rax, %rcx			; CHECK-NEXT: btq %rax, %rcx
	; CHECK-NEXT: jb LBB0_38			; CHECK-NEXT: jb LBB0_38
	; CHECK-NEXT: LBB0_35: ## %if.end517			; CHECK-NEXT: LBB0_35: ## %if.end517
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: cmpl $11, %r13d			; CHECK-NEXT: cmpl $11, %r12d
	; CHECK-NEXT: je LBB0_38			; CHECK-NEXT: je LBB0_38
	; CHECK-NEXT: ## %bb.36: ## %if.end517			; CHECK-NEXT: ## %bb.36: ## %if.end517
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: cmpl $24, %r13d			; CHECK-NEXT: cmpl $24, %r12d
	; CHECK-NEXT: je LBB0_38			; CHECK-NEXT: je LBB0_38
	; CHECK-NEXT: ## %bb.37: ## %if.then532			; CHECK-NEXT: ## %bb.37: ## %if.then532
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: movq _SyFgets.yank@{{.*}}(%rip), %rax			; CHECK-NEXT: movq _SyFgets.yank@{{.*}}(%rip), %rax
	; CHECK-NEXT: movb $0, (%rax)			; CHECK-NEXT: movb $0, (%rax)
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_38: ## %for.cond534			; CHECK-NEXT: LBB0_38: ## %for.cond534
	; CHECK-NEXT: ## Parent Loop BB0_13 Depth=1			; CHECK-NEXT: ## Parent Loop BB0_13 Depth=1
	; CHECK-NEXT: ## => This Inner Loop Header: Depth=2			; CHECK-NEXT: ## => This Inner Loop Header: Depth=2
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: jne LBB0_38			; CHECK-NEXT: jne LBB0_38
	; CHECK-NEXT: ## %bb.39: ## %for.cond542.preheader			; CHECK-NEXT: ## %bb.39: ## %for.cond542.preheader
	; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1			; CHECK-NEXT: ## in Loop: Header=BB0_13 Depth=1
	; CHECK-NEXT: testb %dl, %dl			; CHECK-NEXT: testb %bl, %bl
	; CHECK-NEXT: movb $0, (%r12)			; CHECK-NEXT: movb $0, (%r14)
	; CHECK-NEXT: movl %r14d, %r13d			; CHECK-NEXT: movl %ebp, %r12d
	; CHECK-NEXT: leaq {{.*}}(%rip), %rsi			; CHECK-NEXT: movq {{[-0-9]+}}(%r{{[sb]}}p), %r14 ## 8-byte Reload
	; CHECK-NEXT: leaq {{.*}}(%rip), %rdi
	; CHECK-NEXT: jmp LBB0_21			; CHECK-NEXT: jmp LBB0_21
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_42: ## %while.cond864			; CHECK-NEXT: LBB0_42: ## %while.cond864
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: jmp LBB0_42			; CHECK-NEXT: jmp LBB0_42
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_43: ## %while.cond962			; CHECK-NEXT: LBB0_43: ## %while.cond962
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: jmp LBB0_43			; CHECK-NEXT: jmp LBB0_43
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_25: ## %for.cond357			; CHECK-NEXT: LBB0_25: ## %for.cond357
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: jmp LBB0_25			; CHECK-NEXT: jmp LBB0_25
	; CHECK-NEXT: LBB0_11:			; CHECK-NEXT: LBB0_11:
	; CHECK-NEXT: xorl %ebp, %ebp			; CHECK-NEXT: movl $0, {{[-0-9]+}}(%r{{[sb]}}p) ## 4-byte Folded Spill
	; CHECK-NEXT: xorl %r13d, %r13d			; CHECK-NEXT: xorl %r12d, %r12d
	; CHECK-NEXT: LBB0_22: ## %while.end1465			; CHECK-NEXT: LBB0_22: ## %while.end1465
	; CHECK-NEXT: incl %r13d			; CHECK-NEXT: incl %r12d
	; CHECK-NEXT: cmpl $16, %r13d			; CHECK-NEXT: cmpl $16, %r12d
	; CHECK-NEXT: ja LBB0_50			; CHECK-NEXT: ja LBB0_50
	; CHECK-NEXT: ## %bb.23: ## %while.end1465			; CHECK-NEXT: ## %bb.23: ## %while.end1465
	; CHECK-NEXT: movl $83969, %eax ## imm = 0x14801			; CHECK-NEXT: movl $83969, %eax ## imm = 0x14801
	; CHECK-NEXT: btl %r13d, %eax			; CHECK-NEXT: btl %r12d, %eax
	; CHECK-NEXT: jae LBB0_50			; CHECK-NEXT: jae LBB0_50
	; CHECK-NEXT: ## %bb.24:			; CHECK-NEXT: ## %bb.24:
	; CHECK-NEXT: xorl %ebp, %ebp			; CHECK-NEXT: xorl %ebx, %ebx
	; CHECK-NEXT: movq {{[-0-9]+}}(%r{{[sb]}}p), %rbx ## 8-byte Reload
	; CHECK-NEXT: LBB0_48: ## %if.then1477			; CHECK-NEXT: LBB0_48: ## %if.then1477
	; CHECK-NEXT: movl $1, %edx			; CHECK-NEXT: movl $1, %edx
	; CHECK-NEXT: callq _write			; CHECK-NEXT: callq _write
	; CHECK-NEXT: subq %rbp, %rbx			; CHECK-NEXT: subq %rbx, %r14
	; CHECK-NEXT: movq _syHistory@{{.*}}(%rip), %rax			; CHECK-NEXT: movq _syHistory@{{.*}}(%rip), %rax
	; CHECK-NEXT: leaq 8189(%rbx,%rax), %rax			; CHECK-NEXT: leaq 8189(%r14,%rax), %rax
	; CHECK-NEXT: .p2align 4, 0x90			; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_49: ## %for.body1723			; CHECK-NEXT: LBB0_49: ## %for.body1723
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: decq %rax			; CHECK-NEXT: decq %rax
	; CHECK-NEXT: jmp LBB0_49			; CHECK-NEXT: jmp LBB0_49
				; CHECK-NEXT: LBB0_47: ## %if.then1477.loopexit
				; CHECK-NEXT: movq %r14, %rbx
				; CHECK-NEXT: jmp LBB0_48
				; CHECK-NEXT: LBB0_16: ## %while.cond635.preheader
				; CHECK-NEXT: xorl %eax, %eax
				; CHECK-NEXT: testb %al, %al
				; CHECK-NEXT: je LBB0_41
				; CHECK-NEXT: .p2align 4, 0x90
				; CHECK-NEXT: LBB0_17: ## %for.body643.us
				; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
				; CHECK-NEXT: jmp LBB0_17
				; CHECK-NEXT: .p2align 4, 0x90
				; CHECK-NEXT: LBB0_41: ## %while.cond661
				; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
				; CHECK-NEXT: jmp LBB0_41
	; CHECK-NEXT: LBB0_50: ## %for.cond1480.preheader			; CHECK-NEXT: LBB0_50: ## %for.cond1480.preheader
	; CHECK-NEXT: movl $512, %eax ## imm = 0x200			; CHECK-NEXT: movl $512, %eax ## imm = 0x200
	; CHECK-NEXT: cmpq %rax, %rax			; CHECK-NEXT: cmpq %rax, %rax
	; CHECK-NEXT: jae LBB0_55			; CHECK-NEXT: jae LBB0_55
	; CHECK-NEXT: ## %bb.51: ## %for.body1664.lr.ph			; CHECK-NEXT: ## %bb.51: ## %for.body1664.lr.ph
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: jne LBB0_54			; CHECK-NEXT: jne LBB0_54
	; CHECK-NEXT: ## %bb.52: ## %while.body1679.preheader			; CHECK-NEXT: ## %bb.52: ## %while.body1679.preheader
	; CHECK-NEXT: incl %ebp			; CHECK-NEXT: incl {{[-0-9]+}}(%r{{[sb]}}p) ## 4-byte Folded Spill
	; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_53: ## %while.body1679			; CHECK-NEXT: LBB0_53: ## %while.body1679
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1			; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: movq (%rbx), %rdi			; CHECK-NEXT: movq {{[-0-9]+}}(%r{{[sb]}}p), %rax ## 8-byte Reload
				; CHECK-NEXT: movq (%rax), %rdi
	; CHECK-NEXT: callq _fileno			; CHECK-NEXT: callq _fileno
	; CHECK-NEXT: movslq %ebp, %rax			; CHECK-NEXT: movslq {{[-0-9]+}}(%r{{[sb]}}p), %rax ## 4-byte Folded Reload
	; CHECK-NEXT: leal 1(%rax), %ebp			; CHECK-NEXT: leal 1(%rax), %ecx
				; CHECK-NEXT: movl %ecx, {{[-0-9]+}}(%r{{[sb]}}p) ## 4-byte Spill
	; CHECK-NEXT: cmpq %rax, %rax			; CHECK-NEXT: cmpq %rax, %rax
	; CHECK-NEXT: jl LBB0_53			; CHECK-NEXT: jl LBB0_53
	; CHECK-NEXT: LBB0_54: ## %while.cond1683.preheader			; CHECK-NEXT: LBB0_54: ## %while.cond1683.preheader
	; CHECK-NEXT: xorl %eax, %eax			; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al			; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: LBB0_55: ## %if.then.i			; CHECK-NEXT: LBB0_55: ## %if.then.i
	; CHECK-NEXT: ud2			; CHECK-NEXT: ud2
	; CHECK-NEXT: LBB0_47: ## %if.then1477.loopexit
	; CHECK-NEXT: movq {{[-0-9]+}}(%r{{[sb]}}p), %rbx ## 8-byte Reload
	; CHECK-NEXT: movq %rbx, %rbp
	; CHECK-NEXT: jmp LBB0_48
	; CHECK-NEXT: LBB0_16: ## %while.cond635.preheader
	; CHECK-NEXT: xorl %eax, %eax
	; CHECK-NEXT: testb %al, %al
	; CHECK-NEXT: je LBB0_41
	; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_17: ## %for.body643.us
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: jmp LBB0_17
	; CHECK-NEXT: .p2align 4, 0x90
	; CHECK-NEXT: LBB0_41: ## %while.cond661
	; CHECK-NEXT: ## =>This Inner Loop Header: Depth=1
	; CHECK-NEXT: jmp LBB0_41
	entry:			entry:
	%sub.ptr.rhs.cast646 = ptrtoint i8* %line to i64			%sub.ptr.rhs.cast646 = ptrtoint i8* %line to i64
	%old = alloca [512 x i8], align 16			%old = alloca [512 x i8], align 16
	%0 = getelementptr inbounds [512 x i8], [512 x i8]* %old, i64 0, i64 0			%0 = getelementptr inbounds [512 x i8], [512 x i8]* %old, i64 0, i64 0
	switch i64 %fid, label %if.then [			switch i64 %fid, label %if.then [
	i64 2, label %if.end			i64 2, label %if.end
	i64 0, label %if.end			i64 0, label %if.end
	]			]
	▲ Show 20 Lines • Show All 361 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[BPI] Improve unreachable/ColdCall heuristics to handle loops.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 229873

llvm/include/llvm/Analysis/BranchProbabilityInfo.h

llvm/lib/Analysis/BranchProbabilityInfo.cpp

llvm/test/Analysis/BranchProbabilityInfo/basic.ll

llvm/test/Analysis/BranchProbabilityInfo/noreturn.ll

llvm/test/CodeGen/X86/block-placement.ll

llvm/test/CodeGen/X86/pr37916.ll

llvm/test/CodeGen/X86/ragreedy-hoist-spill.ll

This is an archive of the discontinued LLVM Phabricator instance.

[BPI] Improve unreachable/ColdCall heuristics to handle loops. ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 229873

llvm/include/llvm/Analysis/BranchProbabilityInfo.h

llvm/lib/Analysis/BranchProbabilityInfo.cpp

llvm/test/Analysis/BranchProbabilityInfo/basic.ll

llvm/test/Analysis/BranchProbabilityInfo/noreturn.ll

llvm/test/CodeGen/X86/block-placement.ll

llvm/test/CodeGen/X86/pr37916.ll

llvm/test/CodeGen/X86/ragreedy-hoist-spill.ll

[BPI] Improve unreachable/ColdCall heuristics to handle loops.
ClosedPublic