This is an archive of the discontinued LLVM Phabricator instance.

Add alloca size threshold for StackTagging initializer merging.
Accepted · Public

Authored by eugenis on Oct 15 2020, 4:26 PM.

Download Raw Diff

Details

Reviewers

vitalybuka
pcc

Summary

Initializer merging generates pretty inefficient code for large allocas,
and that code also happens to trigger an exponential algorithm somewhere in
the Machine Instruction Scheduler. See https://bugs.llvm.org/show_bug.cgi?id=47867.

This change adds an upper limit for the alloca size. The default limit
is selected such that the worst-case size of memtag-generated code is
similar to that of non-memtag code (but because of ISA quirks, the worst
case is reached at a different alloca size: e.g., memset inlining
triggers at sizes below 512, but stack tagging instructions are 2x
shorter, so the limit is approx. 256).

We could try harder to emit more compact code with initializer merging,
but that would only affect large, sparsely initialized allocas, and
those are doing fine already.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

eugenis created this revision. · Oct 15 2020, 4:26 PM

Herald added a project: Restricted Project. · View Herald Transcript · Oct 15 2020, 4:26 PM

Herald added a subscriber: hiraditya. · View Herald Transcript

Harbormaster completed remote builds in B75241: Diff 298510. · Oct 15 2020, 4:56 PM

Harbormaster completed remote builds in B75242: Diff 298511. · Oct 15 2020, 5:01 PM

Harbormaster completed remote builds in B75340: Diff 298687. · Oct 16 2020, 12:38 PM

ping

vitalybuka accepted this revision. · Oct 19 2020, 1:07 PM

This revision is now accepted and ready to land. · Oct 19 2020, 1:07 PM

Revision Contents

Path

Size

llvm/

lib/

Target/

AArch64/

AArch64StackTagging.cpp

7 lines

test/

CodeGen/

AArch64/

stack-tagging-initializer-merge.ll

14 lines

Diff 298510

llvm/lib/Target/AArch64/AArch64StackTagging.cpp

Show First 20 Lines • Show All 67 Lines • ▼ Show 20 Lines
static cl::opt<bool>		static cl::opt<bool>
ClUseStackSafety("stack-tagging-use-stack-safety", cl::Hidden,		ClUseStackSafety("stack-tagging-use-stack-safety", cl::Hidden,
cl::init(true), cl::ZeroOrMore,		cl::init(true), cl::ZeroOrMore,
cl::desc("Use Stack Safety analysis results"));		cl::desc("Use Stack Safety analysis results"));

static cl::opt<unsigned> ClScanLimit("stack-tagging-merge-init-scan-limit",		static cl::opt<unsigned> ClScanLimit("stack-tagging-merge-init-scan-limit",
cl::init(40), cl::Hidden);		cl::init(40), cl::Hidden);

		static cl::opt<unsigned>
		ClMergeInitSizeLimit("stack-tagging-merge-init-size-limit", cl::init(272),
		cl::Hidden);

static const Align kTagGranuleSize = Align(16);		static const Align kTagGranuleSize = Align(16);

namespace {		namespace {

class InitializerBuilder {		class InitializerBuilder {
uint64_t Size;		uint64_t Size;
const DataLayout *DL;		const DataLayout *DL;
Value *BasePtr;		Value *BasePtr;
▲ Show 20 Lines • Show All 345 Lines • ▼ Show 20 Lines	auto SetTagZeroFunc =
Intrinsic::getDeclaration(F->getParent(), Intrinsic::aarch64_settag_zero);		Intrinsic::getDeclaration(F->getParent(), Intrinsic::aarch64_settag_zero);
auto StgpFunc =		auto StgpFunc =
Intrinsic::getDeclaration(F->getParent(), Intrinsic::aarch64_stgp);		Intrinsic::getDeclaration(F->getParent(), Intrinsic::aarch64_stgp);

InitializerBuilder IB(Size, DL, Ptr, SetTagFunc, SetTagZeroFunc, StgpFunc);		InitializerBuilder IB(Size, DL, Ptr, SetTagFunc, SetTagZeroFunc, StgpFunc);
bool LittleEndian =		bool LittleEndian =
Triple(AI->getModule()->getTargetTriple()).isLittleEndian();		Triple(AI->getModule()->getTargetTriple()).isLittleEndian();
// Current implementation of initializer merging assumes little endianness.		// Current implementation of initializer merging assumes little endianness.
if (MergeInit && !F->hasOptNone() && LittleEndian) {		if (MergeInit && !F->hasOptNone() && LittleEndian &&
		Size < ClMergeInitSizeLimit) {
LLVM_DEBUG(dbgs() << "collecting initializers for " << *AI		LLVM_DEBUG(dbgs() << "collecting initializers for " << *AI
<< ", size = " << Size << "\n");		<< ", size = " << Size << "\n");
InsertBefore = collectInitializers(InsertBefore, Ptr, Size, IB);		InsertBefore = collectInitializers(InsertBefore, Ptr, Size, IB);
}		}

IRBuilder<> IRB(InsertBefore);		IRBuilder<> IRB(InsertBefore);
IB.generate(IRB);		IB.generate(IRB);
}		}
▲ Show 20 Lines • Show All 268 Lines • Show Last 20 Lines

llvm/test/CodeGen/AArch64/stack-tagging-initializer-merge.ll

Show First 20 Lines • Show All 300 Lines • ▼ Show 20 Lines	entry:
call void @use(i8* nonnull %0)		call void @use(i8* nonnull %0)
ret void		ret void
}		}

; CHECK-LABEL: define void @MemSetNonZero3(		; CHECK-LABEL: define void @MemSetNonZero3(
; CHECK: call void @llvm.aarch64.stgp(i8* {{.*}}, i64 46360584388608, i64 0)		; CHECK: call void @llvm.aarch64.stgp(i8* {{.*}}, i64 46360584388608, i64 0)
; CHECK: call void @llvm.aarch64.stgp(i8* {{.*}}, i64 0, i64 3038287259199220266)		; CHECK: call void @llvm.aarch64.stgp(i8* {{.*}}, i64 0, i64 3038287259199220266)
; CHECK: ret void		; CHECK: ret void

		define void @LargeAlloca() sanitize_memtag {
		entry:
		%x = alloca i32, i32 256, align 16
		%0 = bitcast i32* %x to i8*
		call void @llvm.memset.p0i8.i64(i8* nonnull align 16 %0, i8 42, i64 256, i1 false)
		call void @use(i8* nonnull %0)
		ret void
		}

		; CHECK-LABEL: define void @LargeAlloca(
		; CHECK: call void @llvm.aarch64.settag(i8* {{.*}}, i64 1024)
		; CHECK: call void @llvm.memset.p0i8.i64(i8* {{.*}}, i8 42, i64 256,
		; CHECK: ret void