This is an archive of the discontinued LLVM Phabricator instance.

Differential D16763

[X86] Optimize WinEH state stores
ClosedPublic

Authored by majnemer on Jan 31 2016, 9:33 PM.

Download Raw Diff

Details

Reviewers

rnk

Commits

rG7e5937b77541: [WinEH] Optimize WinEH state stores
rL261122: [WinEH] Optimize WinEH state stores

Summary

32-bit x86 Windows targets use a linked list of nodes allocated on the
stack, referenced via thread-local storage. The personality routine
interprets one of the fields in the node as a 'state number' which
indicates where the personality routine should transfer control.

State transitions are possible only before call-sites which may throw
exceptions. Our previous scheme had us update the state number before
all call-sites which may throw.

Instead, we can try to minimize the number of times we need to store by
reasoning about the nearest store which dominates the current call-site.
If the last store agrees with the current call-site, then we know that
the state-update is redundant and can be elided.

This is largely straightforward: an RPO walk of the blocks allows us to
correctly forward-propagate the information when the function is a DAG.
Currently, loops are not handled optimally and may trigger superfluous
state stores.

Diff Detail

Event Timeline

majnemer updated this revision to Diff 46508. Jan 31 2016, 9:33 PM

majnemer retitled this revision from to [X86] Optimize WinEH state stores.

majnemer updated this object.

majnemer added a reviewer: rnk.

majnemer added a subscriber: llvm-commits.

rnk added inline comments. Feb 2 2016, 1:27 PM

lib/Target/X86/X86WinEHState.cpp
505	I'm not really a fan of all these long inline lambdas. I'd rather see this out of line, despite the parameter passing boilerplate: static int getBaseStateForBB(... BBColors, ... FuncInfo, BasicBlock *BB) { ... } You can practically guess the algorithm it's implementing from that prototype.
583	ditto
610	For SEH, I think we need state insertions prior to nounwind calls. This is the case I'm thinking of: void f() { __try { crash(); } __except(1) { } printf("%s\n", nullptr); } The printf call will crash, and it should not end up being caught by the __except block. It needs a -1 store, despite being nounwind. You can avoid state stores prior to intrinsic calls in SEH though. I guess this is a pre-existing bug.
634	grumble grumble
test/CodeGen/WinEH/wineh-statenumbering.ll
137	We should probably add a non-trivial case like: void f(int cond) { if (cond) { __try { crash(); } __except(1) { } } g(); // need -1 store before g }

Address review feedback

lgtm, now our code won't be totally bone-headed. :)

This revision is now accepted and ready to land. Feb 16 2016, 4:39 PM

Closed by commit rL261122: [WinEH] Optimize WinEH state stores (authored by majnemer). · Explain Why · Feb 17 2016, 10:41 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

lib/

Target/

X86/

X86WinEHState.cpp

207 lines

test/

CodeGen/

WinEH/

wineh-statenumbering.ll

72 lines

X86/

cleanuppad-inalloca.ll

2 lines

Diff 48043

lib/Target/X86/X86WinEHState.cpp

Show All 9 Lines
// All functions using an MSVC EH personality use an explicitly updated state		// All functions using an MSVC EH personality use an explicitly updated state
// number stored in an exception registration stack object. The registration		// number stored in an exception registration stack object. The registration
// object is linked into a thread-local chain of registrations stored at fs:00.		// object is linked into a thread-local chain of registrations stored at fs:00.
// This pass adds the registration object and EH state updates.		// This pass adds the registration object and EH state updates.
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

#include "X86.h"		#include "X86.h"
		#include "llvm/ADT/PostOrderIterator.h"
		#include "llvm/Analysis/CFG.h"
#include "llvm/Analysis/EHPersonalities.h"		#include "llvm/Analysis/EHPersonalities.h"
#include "llvm/CodeGen/MachineModuleInfo.h"		#include "llvm/CodeGen/MachineModuleInfo.h"
#include "llvm/CodeGen/WinEHFuncInfo.h"		#include "llvm/CodeGen/WinEHFuncInfo.h"
		#include "llvm/IR/CallSite.h"
		#include "llvm/IR/Function.h"
#include "llvm/IR/Instructions.h"		#include "llvm/IR/Instructions.h"
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/IRBuilder.h"		#include "llvm/IR/IRBuilder.h"
#include "llvm/IR/Module.h"		#include "llvm/IR/Module.h"
#include "llvm/Pass.h"		#include "llvm/Pass.h"
		#include "llvm/Support/Debug.h"
		#include <deque>

using namespace llvm;		using namespace llvm;

#define DEBUG_TYPE "winehstate"		#define DEBUG_TYPE "winehstate"

namespace llvm {		namespace llvm {
void initializeWinEHStatePassPass(PassRegistry &);		void initializeWinEHStatePassPass(PassRegistry &);
}		}

namespace {		namespace {
		const int OverdefinedState = INT_MIN;

class WinEHStatePass : public FunctionPass {		class WinEHStatePass : public FunctionPass {
public:		public:
static char ID; // Pass identification, replacement for typeid.		static char ID; // Pass identification, replacement for typeid.

WinEHStatePass() : FunctionPass(ID) {		WinEHStatePass() : FunctionPass(ID) {
initializeWinEHStatePassPass(*PassRegistry::getPassRegistry());		initializeWinEHStatePassPass(*PassRegistry::getPassRegistry());
}		}

Show All 33 Lines	private:
StructType *SEHRegistrationTy = nullptr;		StructType *SEHRegistrationTy = nullptr;
Function *FrameRecover = nullptr;		Function *FrameRecover = nullptr;
Function *FrameAddress = nullptr;		Function *FrameAddress = nullptr;
Function *FrameEscape = nullptr;		Function *FrameEscape = nullptr;

// Per-function state		// Per-function state
EHPersonality Personality = EHPersonality::Unknown;		EHPersonality Personality = EHPersonality::Unknown;
Function *PersonalityFn = nullptr;		Function *PersonalityFn = nullptr;
		bool UseStackGuard = false;
		int ParentBaseState;

/// The stack allocation containing all EH data, including the link in the		/// The stack allocation containing all EH data, including the link in the
/// fs:00 chain and the current state.		/// fs:00 chain and the current state.
AllocaInst *RegNode = nullptr;		AllocaInst *RegNode = nullptr;

/// The index of the state field of RegNode.		/// The index of the state field of RegNode.
int StateFieldIndex = ~0U;		int StateFieldIndex = ~0U;

▲ Show 20 Lines • Show All 72 Lines • ▼ Show 20 Lines	bool WinEHStatePass::runOnFunction(Function &F) {
// will be in trouble. If this assumption is ever broken, we should turn the		// will be in trouble. If this assumption is ever broken, we should turn the
// numbers into an immutable analysis pass.		// numbers into an immutable analysis pass.
WinEHFuncInfo FuncInfo;		WinEHFuncInfo FuncInfo;
addStateStores(F, FuncInfo);		addStateStores(F, FuncInfo);

// Reset per-function state.		// Reset per-function state.
PersonalityFn = nullptr;		PersonalityFn = nullptr;
Personality = EHPersonality::Unknown;		Personality = EHPersonality::Unknown;
		UseStackGuard = false;
return true;		return true;
}		}

/// Get the common EH registration subobject:		/// Get the common EH registration subobject:
/// typedef _EXCEPTION_DISPOSITION (*PEXCEPTION_ROUTINE)(		/// typedef _EXCEPTION_DISPOSITION (*PEXCEPTION_ROUTINE)(
/// _EXCEPTION_RECORD , void , _CONTEXT , void );		/// _EXCEPTION_RECORD , void , _CONTEXT , void );
/// struct EHRegistrationNode {		/// struct EHRegistrationNode {
/// EHRegistrationNode *Next;		/// EHRegistrationNode *Next;
▲ Show 20 Lines • Show All 61 Lines • ▼ Show 20 Lines
// and after that is personality function specific.		// and after that is personality function specific.
void WinEHStatePass::emitExceptionRegistrationRecord(Function *F) {		void WinEHStatePass::emitExceptionRegistrationRecord(Function *F) {
assert(Personality == EHPersonality::MSVC_CXX \|\|		assert(Personality == EHPersonality::MSVC_CXX \|\|
Personality == EHPersonality::MSVC_X86SEH);		Personality == EHPersonality::MSVC_X86SEH);

// Struct type of RegNode. Used for GEPing.		// Struct type of RegNode. Used for GEPing.
Type *RegNodeTy;		Type *RegNodeTy;

StringRef PersonalityName = PersonalityFn->getName();
IRBuilder<> Builder(&F->getEntryBlock(), F->getEntryBlock().begin());		IRBuilder<> Builder(&F->getEntryBlock(), F->getEntryBlock().begin());
Type *Int8PtrType = Builder.getInt8PtrTy();		Type *Int8PtrType = Builder.getInt8PtrTy();
if (Personality == EHPersonality::MSVC_CXX) {		if (Personality == EHPersonality::MSVC_CXX) {
RegNodeTy = getCXXEHRegistrationType();		RegNodeTy = getCXXEHRegistrationType();
RegNode = Builder.CreateAlloca(RegNodeTy);		RegNode = Builder.CreateAlloca(RegNodeTy);
// SavedESP = llvm.stacksave()		// SavedESP = llvm.stacksave()
Value *SP = Builder.CreateCall(		Value *SP = Builder.CreateCall(
Intrinsic::getDeclaration(TheModule, Intrinsic::stacksave), {});		Intrinsic::getDeclaration(TheModule, Intrinsic::stacksave), {});
Builder.CreateStore(SP, Builder.CreateStructGEP(RegNodeTy, RegNode, 0));		Builder.CreateStore(SP, Builder.CreateStructGEP(RegNodeTy, RegNode, 0));
// TryLevel = -1		// TryLevel = -1
StateFieldIndex = 2;		StateFieldIndex = 2;
insertStateNumberStore(&*Builder.GetInsertPoint(), -1);		ParentBaseState = -1;
		insertStateNumberStore(&*Builder.GetInsertPoint(), ParentBaseState);
// Handler = __ehhandler$F		// Handler = __ehhandler$F
Function *Trampoline = generateLSDAInEAXThunk(F);		Function *Trampoline = generateLSDAInEAXThunk(F);
Link = Builder.CreateStructGEP(RegNodeTy, RegNode, 1);		Link = Builder.CreateStructGEP(RegNodeTy, RegNode, 1);
linkExceptionRegistration(Builder, Trampoline);		linkExceptionRegistration(Builder, Trampoline);
} else if (Personality == EHPersonality::MSVC_X86SEH) {		} else if (Personality == EHPersonality::MSVC_X86SEH) {
// If _except_handler4 is in use, some additional guard checks and prologue		// If _except_handler4 is in use, some additional guard checks and prologue
// stuff is required.		// stuff is required.
bool UseStackGuard = (PersonalityName == "_except_handler4");
RegNodeTy = getSEHRegistrationType();		RegNodeTy = getSEHRegistrationType();
RegNode = Builder.CreateAlloca(RegNodeTy);		RegNode = Builder.CreateAlloca(RegNodeTy);
// SavedESP = llvm.stacksave()		// SavedESP = llvm.stacksave()
Value *SP = Builder.CreateCall(		Value *SP = Builder.CreateCall(
Intrinsic::getDeclaration(TheModule, Intrinsic::stacksave), {});		Intrinsic::getDeclaration(TheModule, Intrinsic::stacksave), {});
Builder.CreateStore(SP, Builder.CreateStructGEP(RegNodeTy, RegNode, 0));		Builder.CreateStore(SP, Builder.CreateStructGEP(RegNodeTy, RegNode, 0));
// TryLevel = -2 / -1		// TryLevel = -2 / -1
StateFieldIndex = 4;		StateFieldIndex = 4;
insertStateNumberStore(&*Builder.GetInsertPoint(), UseStackGuard ? -2 : -1);		StringRef PersonalityName = PersonalityFn->getName();
		UseStackGuard = (PersonalityName == "_except_handler4");
		ParentBaseState = UseStackGuard ? -2 : -1;
		insertStateNumberStore(&*Builder.GetInsertPoint(), ParentBaseState);
// ScopeTable = llvm.x86.seh.lsda(F)		// ScopeTable = llvm.x86.seh.lsda(F)
Value *FI8 = Builder.CreateBitCast(F, Int8PtrType);		Value *FI8 = Builder.CreateBitCast(F, Int8PtrType);
Value *LSDA = Builder.CreateCall(		Value *LSDA = Builder.CreateCall(
Intrinsic::getDeclaration(TheModule, Intrinsic::x86_seh_lsda), FI8);		Intrinsic::getDeclaration(TheModule, Intrinsic::x86_seh_lsda), FI8);
Type *Int32Ty = Type::getInt32Ty(TheModule->getContext());		Type *Int32Ty = Type::getInt32Ty(TheModule->getContext());
LSDA = Builder.CreatePtrToInt(LSDA, Int32Ty);		LSDA = Builder.CreatePtrToInt(LSDA, Int32Ty);
// If using _except_handler4, xor the address of the table with		// If using _except_handler4, xor the address of the table with
// __security_cookie.		// __security_cookie.
▲ Show 20 Lines • Show All 95 Lines • ▼ Show 20 Lines	void WinEHStatePass::unlinkExceptionRegistration(IRBuilder<> &Builder) {
// [fs:00] = Link->Next		// [fs:00] = Link->Next
Value *Next =		Value *Next =
Builder.CreateLoad(Builder.CreateStructGEP(LinkTy, Link, 0));		Builder.CreateLoad(Builder.CreateStructGEP(LinkTy, Link, 0));
Constant *FSZero =		Constant *FSZero =
Constant::getNullValue(LinkTy->getPointerTo()->getPointerTo(257));		Constant::getNullValue(LinkTy->getPointerTo()->getPointerTo(257));
Builder.CreateStore(Next, FSZero);		Builder.CreateStore(Next, FSZero);
}		}

		// Figure out what state we should assign calls in this block.
		static int getBaseStateForBB(DenseMap<BasicBlock *, ColorVector> &BlockColors,
		WinEHFuncInfo &FuncInfo, BasicBlock *BB) {
		int BaseState = -1;
		auto &BBColors = BlockColors[BB];

		assert(BBColors.size() == 1 && "multi-color BB not removed by preparation");
		BasicBlock *FuncletEntryBB = BBColors.front();
		if (auto *FuncletPad =
		dyn_cast<FuncletPadInst>(FuncletEntryBB->getFirstNonPHI())) {
		auto BaseStateI = FuncInfo.FuncletBaseStateMap.find(FuncletPad);
		if (BaseStateI != FuncInfo.FuncletBaseStateMap.end())
		BaseState = BaseStateI->second;
		}

		return BaseState;
		}

		// Calculate the state a call-site is in.
		static int getStateForCallSite(DenseMap<BasicBlock *, ColorVector> &BlockColors,
		WinEHFuncInfo &FuncInfo, CallSite CS) {
		if (auto *II = dyn_cast<InvokeInst>(CS.getInstruction())) {
		// Look up the state number of the EH pad this unwinds to.
		assert(FuncInfo.InvokeStateMap.count(II) && "invoke has no state!");
		return FuncInfo.InvokeStateMap[II];
		}
		// Possibly throwing call instructions have no actions to take after
		// an unwind. Ensure they are in the -1 state.
		return getBaseStateForBB(BlockColors, FuncInfo, CS.getParent());
		}

		// Calculate the intersection of all the FinalStates for a BasicBlock's
		// predecessor.
		static int getPredState(DenseMap<BasicBlock *, int> &FinalStates, Function &F,
		int ParentBaseState, BasicBlock *BB) {
		// The entry block has no predecessors but we know that the prologue always
		// sets us up with a fixed state.
		if (&F.getEntryBlock() == BB)
		return ParentBaseState;

		// This is an EH Pad, conservatively report this basic block as overdefined.
		if (BB->isEHPad())
		return OverdefinedState;

		int CommonState = OverdefinedState;
		for (BasicBlock *PredBB : predecessors(BB)) {
		// We didn't manage to get a state for one of these predecessors,
		// conservatively report this basic block as overdefined.
		auto PredEndState = FinalStates.find(PredBB);
		if (PredEndState == FinalStates.end())
		return OverdefinedState;

		// This code is reachable via exceptional control flow,
		// conservatively report this basic block as overdefined.
		if (isa<CatchReturnInst>(PredBB->getTerminator()))
		return OverdefinedState;

		int PredState = PredEndState->second;
		assert(PredState != OverdefinedState &&
		"overdefined BBs shouldn't be in FinalStates");
		if (CommonState == OverdefinedState)
		CommonState = PredState;

		// At least two predecessors have different FinalStates,
		// conservatively report this basic block as overdefined.
		if (CommonState != PredState)
		return OverdefinedState;
		}

		return CommonState;
		};

		static bool isStateStoreNeeded(EHPersonality Personality, CallSite CS) {
		if (!CS)
		return false;

		if (isAsynchronousEHPersonality(Personality))
		return !CS.doesNotAccessMemory();

		return !CS.doesNotThrow();
		}

void WinEHStatePass::addStateStores(Function &F, WinEHFuncInfo &FuncInfo) {		void WinEHStatePass::addStateStores(Function &F, WinEHFuncInfo &FuncInfo) {
// Mark the registration node. The backend needs to know which alloca it is so		// Mark the registration node. The backend needs to know which alloca it is so
// that it can recover the original frame pointer.		// that it can recover the original frame pointer.
IRBuilder<> Builder(RegNode->getParent(), std::next(RegNode->getIterator()));		IRBuilder<> Builder(RegNode->getParent(), std::next(RegNode->getIterator()));
Value *RegNodeI8 = Builder.CreateBitCast(RegNode, Builder.getInt8PtrTy());		Value *RegNodeI8 = Builder.CreateBitCast(RegNode, Builder.getInt8PtrTy());
Builder.CreateCall(		Builder.CreateCall(
Intrinsic::getDeclaration(TheModule, Intrinsic::x86_seh_ehregnode),		Intrinsic::getDeclaration(TheModule, Intrinsic::x86_seh_ehregnode),
{RegNodeI8});		{RegNodeI8});

// Calculate state numbers.		// Calculate state numbers.
if (isAsynchronousEHPersonality(Personality))		if (isAsynchronousEHPersonality(Personality))
calculateSEHStateNumbers(&F, FuncInfo);		calculateSEHStateNumbers(&F, FuncInfo);
else		else
calculateWinCXXEHStateNumbers(&F, FuncInfo);		calculateWinCXXEHStateNumbers(&F, FuncInfo);

// Iterate all the instructions and emit state number stores.		// Iterate all the instructions and emit state number stores.
DenseMap<BasicBlock *, ColorVector> BlockColors = colorEHFunclets(F);		DenseMap<BasicBlock *, ColorVector> BlockColors = colorEHFunclets(F);
for (BasicBlock &BB : F) {		ReversePostOrderTraversal<Function *> RPOT(&F);
// Figure out what state we should assign calls in this block.
int BaseState = -1;
auto &BBColors = BlockColors[&BB];

assert(BBColors.size() == 1 &&		// InitialStates yields the state of the first call-site for a BasicBlock.
		rnkUnsubmitted Not Done Reply Inline Actions I'm not really a fan of all these long inline lambdas. I'd rather see this out of line, despite the parameter passing boilerplate: static int getBaseStateForBB(... BBColors, ... FuncInfo, BasicBlock *BB) { ... } You can practically guess the algorithm it's implementing from that prototype. rnk: I'm not really a fan of all these long inline lambdas. I'd rather see this out of line, despite…
"multi-color BB not removed by preparation");		DenseMap<BasicBlock *, int> InitialStates;
BasicBlock *FuncletEntryBB = BBColors.front();		// FinalStates yields the state of the last call-site for a BasicBlock.
if (auto *FuncletPad =		DenseMap<BasicBlock *, int> FinalStates;
dyn_cast<FuncletPadInst>(FuncletEntryBB->getFirstNonPHI())) {		// Worklist used to revisit BasicBlocks with indeterminate
// We do not support nesting funclets within cleanuppads.		// Initial/Final-States.
if (isa<CleanupPadInst>(FuncletPad))		std::deque<BasicBlock *> Worklist;
		// Fill in InitialStates and FinalStates for BasicBlocks with call-sites.
		for (BasicBlock *BB : RPOT) {
		int InitialState = OverdefinedState;
		int FinalState;
		if (&F.getEntryBlock() == BB)
		InitialState = FinalState = ParentBaseState;
		for (Instruction &I : *BB) {
		CallSite CS(&I);
		if (!isStateStoreNeeded(Personality, CS))
continue;		continue;

auto BaseStateI = FuncInfo.FuncletBaseStateMap.find(FuncletPad);		int State = getStateForCallSite(BlockColors, FuncInfo, CS);
if (BaseStateI != FuncInfo.FuncletBaseStateMap.end())		if (InitialState == OverdefinedState)
BaseState = BaseStateI->second;		InitialState = State;
		FinalState = State;
		}
		// No call-sites in this basic block? That's OK, we will come back to these
		// in a later pass.
		if (InitialState == OverdefinedState) {
		Worklist.push_back(BB);
		continue;
		}
		DEBUG(dbgs() << "X86WinEHState: " << BB->getName()
		<< " InitialState=" << InitialState << '\n');
		DEBUG(dbgs() << "X86WinEHState: " << BB->getName()
		<< " FinalState=" << FinalState << '\n');
		InitialStates.insert({BB, InitialState});
		FinalStates.insert({BB, FinalState});
}		}

for (Instruction &I : BB) {		// Try to fill-in InitialStates and FinalStates which have no call-sites.
if (auto *CI = dyn_cast<CallInst>(&I)) {		while (!Worklist.empty()) {
// Possibly throwing call instructions have no actions to take after		BasicBlock *BB = Worklist.front();
// an unwind. Ensure they are in the -1 state.		Worklist.pop_front();
if (CI->doesNotThrow())		// This BasicBlock has already been figured out, nothing more we can do.
		if (InitialStates.count(BB) != 0)
continue;		continue;
insertStateNumberStore(CI, BaseState);
} else if (auto *II = dyn_cast<InvokeInst>(&I)) {		int PredState = getPredState(FinalStates, F, ParentBaseState, BB);
// Look up the state number of the landingpad this unwinds to.		if (PredState == OverdefinedState)
assert(FuncInfo.InvokeStateMap.count(II) && "invoke has no state!");		continue;
int State = FuncInfo.InvokeStateMap[II];
insertStateNumberStore(II, State);		// We successfully inferred this BasicBlock's state via it's predecessors;
		// enqueue it's successors to see if we can infer their states.
		InitialStates.insert({BB, PredState});
		FinalStates.insert({BB, PredState});
		for (BasicBlock *SuccBB : successors(BB))
		Worklist.push_back(SuccBB);
}		}

		// Finally, insert state stores before call-sites which transition us to a new
		// state.
		for (BasicBlock *BB : RPOT) {
		auto &BBColors = BlockColors[BB];
		BasicBlock *FuncletEntryBB = BBColors.front();
		if (isa<CleanupPadInst>(FuncletEntryBB->getFirstNonPHI()))
		continue;

		int PrevState = getPredState(FinalStates, F, ParentBaseState, BB);
		DEBUG(dbgs() << "X86WinEHState: " << BB->getName()
		<< " PrevState=" << PrevState << '\n');

		for (Instruction &I : *BB) {
		CallSite CS(&I);
		if (!isStateStoreNeeded(Personality, CS))
		continue;

		int State = getStateForCallSite(BlockColors, FuncInfo, CS);
		if (State != PrevState)
		insertStateNumberStore(&I, State);
		PrevState = State;
}		}
		rnkUnsubmitted Not Done Reply Inline Actions ditto rnk: ditto
}		}
}		}

void WinEHStatePass::insertStateNumberStore(Instruction *IP, int State) {		void WinEHStatePass::insertStateNumberStore(Instruction *IP, int State) {
IRBuilder<> Builder(IP);		IRBuilder<> Builder(IP);
Value *StateField =		Value *StateField =
Builder.CreateStructGEP(nullptr, RegNode, StateFieldIndex);		Builder.CreateStructGEP(nullptr, RegNode, StateFieldIndex);
Builder.CreateStore(Builder.getInt32(State), StateField);		Builder.CreateStore(Builder.getInt32(State), StateField);
}		}
		rnkUnsubmitted Not Done Reply Inline Actions For SEH, I think we need state insertions prior to nounwind calls. This is the case I'm thinking of: void f() { __try { crash(); } __except(1) { } printf("%s\n", nullptr); } The printf call will crash, and it should not end up being caught by the __except block. It needs a -1 store, despite being nounwind. You can avoid state stores prior to intrinsic calls in SEH though. I guess this is a pre-existing bug. rnk: For SEH, I think we need state insertions prior to nounwind calls. This is the case I'm…
		rnkUnsubmitted Not Done Reply Inline Actions grumble grumble rnk: grumble grumble

test/CodeGen/WinEH/wineh-statenumbering.ll

	Show All 22 Lines
	@_TI1H = linkonce_odr unnamed_addr constant %eh.ThrowInfo { i32 0, i8* null, i8* null, i8* bitcast (%eh.CatchableTypeArray.1* @_CTA1H to i8*) }, section ".xdata", comdat			@_TI1H = linkonce_odr unnamed_addr constant %eh.ThrowInfo { i32 0, i8* null, i8* null, i8* bitcast (%eh.CatchableTypeArray.1* @_CTA1H to i8*) }, section ".xdata", comdat

	define i32 @main() #0 personality i32 (...)* @__CxxFrameHandler3 {			define i32 @main() #0 personality i32 (...)* @__CxxFrameHandler3 {
	entry:			entry:
	%tmp = alloca i32, align 4			%tmp = alloca i32, align 4
	; CHECK: entry:			; CHECK: entry:
	; CHECK: store i32 -1			; CHECK: store i32 -1
	; CHECK: call void @g(i32 3)			; CHECK: call void @g(i32 3)
				; CHECK-NEXT: call void @g(i32 4)
				; CHECK-NEXT: call void @g(i32 5)
	call void @g(i32 3)			call void @g(i32 3)
				call void @g(i32 4)
				call void @g(i32 5)
	store i32 0, i32* %tmp, align 4			store i32 0, i32* %tmp, align 4
	%0 = bitcast i32* %tmp to i8*			%0 = bitcast i32* %tmp to i8*
	; CHECK: store i32 0			; CHECK: store i32 0
	; CHECK: invoke void @_CxxThrowException(			; CHECK: invoke void @_CxxThrowException(
	invoke void @_CxxThrowException(i8* %0, %eh.ThrowInfo* nonnull @_TI1H) #1			invoke void @_CxxThrowException(i8* %0, %eh.ThrowInfo* nonnull @_TI1H) #1
	to label %unreachable.for.entry unwind label %catch.dispatch			to label %unreachable.for.entry unwind label %catch.dispatch

	catch.dispatch: ; preds = %entry			catch.dispatch: ; preds = %entry
	Show All 9 Lines

	catch.dispatch.1: ; preds = %catch			catch.dispatch.1: ; preds = %catch
	%cs2 = catchswitch within %1 [label %catch.3] unwind to caller			%cs2 = catchswitch within %1 [label %catch.3] unwind to caller
	catch.3: ; preds = %catch.dispatch.1			catch.3: ; preds = %catch.dispatch.1
	%2 = catchpad within %cs2 [i8* null, i32 u0x40, i8* null]			%2 = catchpad within %cs2 [i8* null, i32 u0x40, i8* null]
	; CHECK: catch.3:			; CHECK: catch.3:
	; CHECK: store i32 3			; CHECK: store i32 3
	; CHECK: call void @g(i32 1)			; CHECK: call void @g(i32 1)
				; CHECK-NEXT: call void @g(i32 2)
				; CHECK-NEXT: call void @g(i32 3)
	call void @g(i32 1)			call void @g(i32 1)
				call void @g(i32 2)
				call void @g(i32 3)
	catchret from %2 to label %try.cont			catchret from %2 to label %try.cont

	try.cont: ; preds = %catch.3			try.cont: ; preds = %catch.3
	; CHECK: try.cont:			; CHECK: try.cont:
	; CHECK: store i32 1			; CHECK: store i32 1
	; CHECK: call void @g(i32 2)			; CHECK: call void @g(i32 2)
				; CHECK-NEXT: call void @g(i32 3)
				; CHECK-NEXT: call void @g(i32 4)
	call void @g(i32 2)			call void @g(i32 2)
				call void @g(i32 3)
				call void @g(i32 4)
	unreachable			unreachable

	unreachable: ; preds = %catch			unreachable: ; preds = %catch
	unreachable			unreachable

	unreachable.for.entry: ; preds = %entry			unreachable.for.entry: ; preds = %entry
	unreachable			unreachable
	}			}
	Show All 33 Lines
	catch2: ; preds = %catch.dispatch1			catch2: ; preds = %catch.dispatch1
	%3 = catchpad within %2 [i8* null, i32 64, i8* null]			%3 = catchpad within %2 [i8* null, i32 64, i8* null]
	catchret from %3 to label %try.cont			catchret from %3 to label %try.cont

	try.cont: ; preds = %catch2			try.cont: ; preds = %catch2
	; CHECK: try.cont:			; CHECK: try.cont:
	; CHECK: store i32 1			; CHECK: store i32 1
	; CHECK: call void @dtor()			; CHECK: call void @dtor()
				; CHECK-NEXT: call void @dtor()
				; CHECK-NEXT: call void @dtor()
				call void @dtor() #3 [ "funclet"(token %1) ]
				call void @dtor() #3 [ "funclet"(token %1) ]
	call void @dtor() #3 [ "funclet"(token %1) ]			call void @dtor() #3 [ "funclet"(token %1) ]
	catchret from %1 to label %try.cont4			catchret from %1 to label %try.cont4

	try.cont4: ; preds = %try.cont			try.cont4: ; preds = %try.cont
	ret void			ret void

	ehcleanup: ; preds = %catch.dispatch1			ehcleanup: ; preds = %catch.dispatch1
	%4 = cleanuppad within %1 []			%4 = cleanuppad within %1 []
				rnkUnsubmitted Not Done Reply Inline Actions We should probably add a non-trivial case like: void f(int cond) { if (cond) { __try { crash(); } __except(1) { } } g(); // need -1 store before g } rnk: We should probably add a non-trivial case like: void f(int cond) { if (cond) { __try {…
	; CHECK: ehcleanup:			; CHECK: ehcleanup:
	; CHECK: call void @dtor()			; CHECK: call void @dtor()
	call void @dtor() #3 [ "funclet"(token %4) ]			call void @dtor() #3 [ "funclet"(token %4) ]
	cleanupret from %4 unwind to caller			cleanupret from %4 unwind to caller

	unreachable: ; preds = %entry			unreachable: ; preds = %entry
	unreachable			unreachable

	unreachable1: ; preds = %catch			unreachable1: ; preds = %catch
	unreachable			unreachable
	}			}

				; CHECK-LABEL: define void @required_state_store(
				define void @required_state_store(i1 zeroext %cond) personality i32 (...)* @_except_handler3 {
				entry:
				%__exception_code = alloca i32, align 4
				call void (...) @llvm.localescape(i32* nonnull %__exception_code)
				; CHECK: store i32 -1
				; CHECK: call void @g(i32 0)
				call void @g(i32 0)
				br i1 %cond, label %if.then, label %if.end

				if.then: ; preds = %entry
				; CHECK: store i32 0
				; CHECK-NEXT: invoke void @g(i32 1)
				invoke void @g(i32 1)
				to label %if.end unwind label %catch.dispatch

				catch.dispatch: ; preds = %if.then
				%0 = catchswitch within none [label %__except.ret] unwind to caller

				__except.ret: ; preds = %catch.dispatch
				%1 = catchpad within %0 [i8* bitcast (i32 ()* @"\01?filt$0@0@required_state_store@@" to i8*)]
				catchret from %1 to label %if.end

				if.end: ; preds = %if.then, %__except.ret, %entry
				; CHECK: store i32 -1
				; CHECK-NEXT: call void @dtor()
				call void @dtor()
				ret void
				}

				define internal i32 @"\01?filt$0@0@required_state_store@@"() {
				entry:
				%0 = tail call i8* @llvm.frameaddress(i32 1)
				%1 = tail call i8* @llvm.x86.seh.recoverfp(i8* bitcast (void (i1)* @required_state_store to i8), i8 %0)
				%2 = tail call i8* @llvm.localrecover(i8* bitcast (void (i1)* @required_state_store to i8), i8 %1, i32 0)
				%__exception_code = bitcast i8* %2 to i32*
				%3 = getelementptr inbounds i8, i8* %0, i32 -20
				%4 = bitcast i8* %3 to { i32, i8 }**
				%5 = load { i32, i8 }, { i32, i8* }** %4, align 4
				%6 = getelementptr inbounds { i32, i8 }, { i32, i8 }* %5, i32 0, i32 0
				%7 = load i32, i32* %6, align 4
				%8 = load i32, i32* %7, align 4
				store i32 %8, i32* %__exception_code, align 4
				ret i32 1
				}

	declare void @g(i32) #0			declare void @g(i32) #0

	declare void @dtor()			declare void @dtor()

	declare x86_stdcallcc void @_CxxThrowException(i8, %eh.ThrowInfo)			declare x86_stdcallcc void @_CxxThrowException(i8, %eh.ThrowInfo)

	declare i32 @__CxxFrameHandler3(...)			declare i32 @__CxxFrameHandler3(...)

				declare i8* @llvm.frameaddress(i32)

				declare i8* @llvm.x86.seh.recoverfp(i8, i8)

				declare i8* @llvm.localrecover(i8, i8, i32)

				declare void @llvm.localescape(...)

				declare i32 @_except_handler3(...)

	attributes #0 = { "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "no-realign-stack" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }			attributes #0 = { "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "no-realign-stack" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }
	attributes #1 = { noreturn }			attributes #1 = { noreturn }

	!llvm.ident = !{!0}			!llvm.ident = !{!0}

	!0 = !{!"clang version 3.8.0 (trunk 245153) (llvm/trunk 245238)"}			!0 = !{!"clang version 3.8.0 (trunk 245153) (llvm/trunk 245238)"}

test/CodeGen/X86/cleanuppad-inalloca.ll

	Show First 20 Lines • Show All 45 Lines • ▼ Show 20 Lines
	; ESP must be restored via EBP due to "dynamic" alloca.			; ESP must be restored via EBP due to "dynamic" alloca.
	; CHECK: leal -{{[0-9]+}}(%ebp), %esp			; CHECK: leal -{{[0-9]+}}(%ebp), %esp
	; CHECK: popl %ebp			; CHECK: popl %ebp
	; CHECK: retl			; CHECK: retl

	; CHECK: "?dtor$2@?0?passes_two@4HA":			; CHECK: "?dtor$2@?0?passes_two@4HA":
	; CHECK: pushl %ebp			; CHECK: pushl %ebp
	; CHECK: subl $8, %esp			; CHECK: subl $8, %esp
	; CHECK: addl $12, %ebp			; CHECK: addl $16, %ebp
	; CHECK: {{movl\|leal}} -{{[0-9]+}}(%ebp), %ecx			; CHECK: {{movl\|leal}} -{{[0-9]+}}(%ebp), %ecx
	; CHECK: calll "??1A@@QAE@XZ"			; CHECK: calll "??1A@@QAE@XZ"
	; CHECK: addl $8, %esp			; CHECK: addl $8, %esp
	; CHECK: retl			; CHECK: retl

	declare void @takes_two(<{ %struct.A, %struct.A }>* inalloca) #0			declare void @takes_two(<{ %struct.A, %struct.A }>* inalloca) #0

	declare x86_thiscallcc %struct.A* @"\01??0A@@QAE@XZ"(%struct.A* returned) #0			declare x86_thiscallcc %struct.A* @"\01??0A@@QAE@XZ"(%struct.A* returned) #0

	declare i32 @__CxxFrameHandler3(...)			declare i32 @__CxxFrameHandler3(...)

	declare x86_thiscallcc void @"\01??1A@@QAE@XZ"(%struct.A*) #0			declare x86_thiscallcc void @"\01??1A@@QAE@XZ"(%struct.A*) #0

	attributes #0 = { "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }			attributes #0 = { "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "unsafe-fp-math"="false" "use-soft-float"="false" }