Diff 378529

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

Show First 20 Lines • Show All 1,838 Lines • ▼ Show 20 Lines

if (StoredConstant && StoredConstant->isNullValue()) {

return false;

auto *InnerCallee = Malloc->getCalledFunction();

if (!InnerCallee)

return false;

LibFunc Func;

if (!TLI.getLibFunc(*InnerCallee, Func) || !TLI.has(Func) ||

Func != LibFunc_malloc)

return false;

auto shouldCreateCalloc = [](CallInst *Malloc, CallInst *Memset) {

// Check for br(icmp(ptr, null), truebb, falsebb) pattern at the end

// of malloc block

auto *MallocBB = Malloc->getParent(),

*MemsetBB = Memset->getParent();

if (MallocBB == MemsetBB)

return true;

auto *Ptr = Memset->getArgOperand(0);

xbolva00Unsubmitted

Done

Hmm, maybe rename this lambda to "shouldCreateCalloc" or "isProfitableToCreateCalloc", or something like that?

xbolva00: hmm.. maybe rename this lambda as "shouldCreateCalloc" or "isProfitableToCreateCalloc" or…

auto *TI = MallocBB->getTerminator();

ICmpInst::Predicate Pred;

BasicBlock *TrueBB, *FalseBB;

if (!match(TI, m_Br(m_ICmp(Pred, m_Specific(Ptr), m_Zero()), TrueBB,

FalseBB)))

return false;

if (Pred != ICmpInst::ICMP_EQ || MemsetBB != FalseBB)

return false;

return true;

xbolva00Unsubmitted

Done

m_Specific(Ptr->stripPointerCasts())),

Do we need it? Can it happen from C source?

float * ptr = (float*)malloc(N * sizeof(float));
                if (ptr != (float*)NULL) {
                    buf[i] = ptr;
                    memset(ptr,'\0',N);
                }

We have there:

%5 = tail call noalias align 16 i8* @malloc(i64 %4) #3
%6 = icmp eq i8* %5, null

xbolva00: m_Specific(Ptr->stripPointerCasts())), Do we need it? Can it happen from C source? ```…

yurai007AuthorUnsubmitted

Done

Right: given that memset always takes an i8* (modulo alignment), there is no reason to assume any in-between casting.

yurai007: Right, given that memset always takes i8* (modulo alignment) no reason to assume in-between…

nikicUnsubmitted

Not Done

return false;

- if (Pred != ICmpInst::ICMP_EQ || MemsetBB != FalseBB)

- return false;

- return true;

+ return Pred == ICmpInst::ICMP_EQ && MemsetBB == FalseBB;

};

if (Malloc->getOperand(0) == MemSet->getLength()) {

nikic:

};

if (Malloc->getOperand(0) == MemSet->getLength()) {

if (DT.dominates(Malloc, MemSet) && PDT.dominates(MemSet, Malloc) &&

if (shouldCreateCalloc(Malloc, MemSet) &&

xbolva00Unsubmitted

Done

You don't need to check for NE, as EQ is canonical. EQ is NE with swapped BBs.

xbolva00: You don't need to check for NE, as EQ is canonical. EQ is NE with swapped BBs.

DT.dominates(Malloc, MemSet) &&

memoryIsNotModifiedBetween(Malloc, MemSet, BatchAA, DL, &DT)) {

xbolva00Unsubmitted

Done

Should we also check that BB2 (the false BB) is MemsetBB?

xbolva00: Check that BB2 (False BB) must be MemsetBB?

IRBuilder<> IRB(Malloc);

const auto &DL = Malloc->getModule()->getDataLayout();

if (auto *Calloc =

emitCalloc(ConstantInt::get(IRB.getIntPtrTy(DL), 1),

Malloc->getArgOperand(0), IRB, TLI)) {

MemorySSAUpdater Updater(&MSSA);

auto *LastDef = cast<MemoryDef>(

Updater.getMemorySSA()->getMemoryAccess(Malloc));

▲ Show 20 Lines • Show All 337 Lines • Show Last 20 Lines

llvm/test/Transforms/DeadStoreElimination/noop-stores.ll

	Show First 20 Lines • Show All 399 Lines • ▼ Show 20 Lines
	if.then: ; preds = %entry			if.then: ; preds = %entry
	tail call void @llvm.memset.p0i8.i64(i8* nonnull align 16 %call, i8 0, i64 %mul, i1 false)			tail call void @llvm.memset.p0i8.i64(i8* nonnull align 16 %call, i8 0, i64 %mul, i1 false)
	br label %if.end			br label %if.end

	if.end: ; preds = %if.then, %entry			if.end: ; preds = %if.then, %entry
	ret i8* %call			ret i8* %call
	}			}

	; FIXME: malloc+memset are not currently transformed into calloc unless the
	; memset post-dominates the malloc.
	define float* @pr25892(i64 %size) {			define float* @pr25892(i64 %size) {
	; CHECK-LABEL: @pr25892(			; CHECK-LABEL: @pr25892(
	; CHECK: entry:			; CHECK: entry:
	; CHECK-NEXT: [[CALL:%.]] = call i8 @malloc(i64 [[SIZE:%.*]])			; CHECK-NEXT: [[CALL:%.]] = call i8 @calloc(i64 1, i64 [[SIZE:%.*]])
	; CHECK-NEXT: [[CMP:%.]] = icmp eq i8 [[CALL]], null			; CHECK-NEXT: [[CMP:%.]] = icmp eq i8 [[CALL]], null
	; CHECK-NEXT: br i1 [[CMP]], label [[CLEANUP:%.]], label [[IF_END:%.]]			; CHECK-NEXT: br i1 [[CMP]], label [[CLEANUP:%.]], label [[IF_END:%.]]
	; CHECK: if.end:			; CHECK: if.end:
	; CHECK-NEXT: [[BC:%.]] = bitcast i8 [[CALL]] to float*			; CHECK-NEXT: [[BC:%.]] = bitcast i8 [[CALL]] to float*
	; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)
	; CHECK-NEXT: br label [[CLEANUP]]			; CHECK-NEXT: br label [[CLEANUP]]
	; CHECK: cleanup:			; CHECK: cleanup:
	; CHECK-NEXT: [[RETVAL_0:%.]] = phi float [ [[BC]], [[IF_END]] ], [ null, [[ENTRY:%.*]] ]			; CHECK-NEXT: [[RETVAL_0:%.]] = phi float [ [[BC]], [[IF_END]] ], [ null, [[ENTRY:%.*]] ]
	; CHECK-NEXT: ret float* [[RETVAL_0]]			; CHECK-NEXT: ret float* [[RETVAL_0]]
	;			;
	entry:			entry:
	%call = call i8* @malloc(i64 %size) inaccessiblememonly			%call = call i8* @malloc(i64 %size) inaccessiblememonly
	%cmp = icmp eq i8* %call, null			%cmp = icmp eq i8* %call, null
	br i1 %cmp, label %cleanup, label %if.end			br i1 %cmp, label %cleanup, label %if.end
	if.end:			if.end:
	%bc = bitcast i8* %call to float*			%bc = bitcast i8* %call to float*
	call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)			call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)
	br label %cleanup			br label %cleanup
	cleanup:			cleanup:
	%retval.0 = phi float* [ %bc, %if.end ], [ null, %entry ]			%retval.0 = phi float* [ %bc, %if.end ], [ null, %entry ]
	ret float* %retval.0			ret float* %retval.0
	}			}

	define float* @pr25892_with_extra_store(i64 %size) {			define float* @pr25892_with_extra_store(i64 %size) {
	; CHECK-LABEL: @pr25892_with_extra_store(			; CHECK-LABEL: @pr25892_with_extra_store(
	; CHECK: entry:			; CHECK: entry:
	; CHECK-NEXT: [[CALL:%.]] = call i8 @malloc(i64 [[SIZE:%.*]])			; CHECK-NEXT: [[CALL:%.]] = call i8 @calloc(i64 1, i64 [[SIZE:%.*]])
	; CHECK-NEXT: [[CMP:%.]] = icmp eq i8 [[CALL]], null			; CHECK-NEXT: [[CMP:%.]] = icmp eq i8 [[CALL]], null
	; CHECK-NEXT: br i1 [[CMP]], label [[CLEANUP:%.]], label [[IF_END:%.]]			; CHECK-NEXT: br i1 [[CMP]], label [[CLEANUP:%.]], label [[IF_END:%.]]
	; CHECK: if.end:			; CHECK: if.end:
	; CHECK-NEXT: [[BC:%.]] = bitcast i8 [[CALL]] to float*			; CHECK-NEXT: [[BC:%.]] = bitcast i8 [[CALL]] to float*
	; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)
	; CHECK-NEXT: store i8 0, i8* %call, align 1
	; CHECK-NEXT: br label [[CLEANUP]]			; CHECK-NEXT: br label [[CLEANUP]]
	; CHECK: cleanup:			; CHECK: cleanup:
	; CHECK-NEXT: [[RETVAL_0:%.]] = phi float [ [[BC]], [[IF_END]] ], [ null, [[ENTRY:%.*]] ]			; CHECK-NEXT: [[RETVAL_0:%.]] = phi float [ [[BC]], [[IF_END]] ], [ null, [[ENTRY:%.*]] ]
	; CHECK-NEXT: ret float* [[RETVAL_0]]			; CHECK-NEXT: ret float* [[RETVAL_0]]
	;			;
	entry:			entry:
	%call = call i8* @malloc(i64 %size) inaccessiblememonly			%call = call i8* @malloc(i64 %size) inaccessiblememonly
	%cmp = icmp eq i8* %call, null			%cmp = icmp eq i8* %call, null
	br i1 %cmp, label %cleanup, label %if.end			br i1 %cmp, label %cleanup, label %if.end
	if.end:			if.end:
	%bc = bitcast i8* %call to float*			%bc = bitcast i8* %call to float*
	call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)			call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %size, i1 false)
	store i8 0, i8* %call, align 1			store i8 0, i8* %call, align 1
	br label %cleanup			br label %cleanup
	cleanup:			cleanup:
	%retval.0 = phi float* [ %bc, %if.end ], [ null, %entry ]			%retval.0 = phi float* [ %bc, %if.end ], [ null, %entry ]
	ret float* %retval.0			ret float* %retval.0
	}			}

				; This should not create a calloc
				; The branch that guards the memset tests (%1 & 32) == 0, i.e. a value
				; unrelated to the malloc result, so the block ending in the malloc does not
				; terminate in a null check of the returned pointer. The expectations below
				; require both the malloc call and the memset to survive unchanged.
				define i8* @malloc_with_no_nointer_null_check(i64 %0, i32 %1) {
				; CHECK-LABEL: @malloc_with_no_nointer_null_check
				; CHECK: entry:
				; CHECK-NEXT: [[CALL:%.*]] = call i8* @malloc(i64 [[TMP0:%.*]])
				; CHECK-NEXT: [[A:%.*]] = and i32 [[TMP1:%.*]], 32
				; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[A]], 0
				; CHECK-NEXT: br i1 [[CMP]], label [[CLEANUP:%.*]], label [[IF_END:%.*]]
				; CHECK: if.end:
				; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* [[CALL]], i8 0, i64 [[TMP0]], i1 false)
				; CHECK-NEXT: br label [[CLEANUP]]
				; CHECK: cleanup:
				; CHECK-NEXT: ret i8* [[CALL]]
				;
				entry:
				%call = call i8* @malloc(i64 %0) inaccessiblememonly
				%a = and i32 %1, 32
				%cmp = icmp eq i32 %a, 0
				br i1 %cmp, label %cleanup, label %if.end
				if.end:
				call void @llvm.memset.p0i8.i64(i8* %call, i8 0, i64 %0, i1 false)
				br label %cleanup
				cleanup:
				ret i8* %call
				}

	; PR50143			; PR50143
	define i8* @store_zero_after_calloc_inaccessiblememonly() {			define i8* @store_zero_after_calloc_inaccessiblememonly() {
	; CHECK-LABEL: @store_zero_after_calloc_inaccessiblememonly(			; CHECK-LABEL: @store_zero_after_calloc_inaccessiblememonly(
	; CHECK-NEXT: [[CALL:%.]] = tail call i8 @calloc(i64 1, i64 10) #[[ATTR6:[0-9]+]]			; CHECK-NEXT: [[CALL:%.]] = tail call i8 @calloc(i64 1, i64 10) #[[ATTR6:[0-9]+]]
	; CHECK-NEXT: store i8 0, i8* [[CALL]], align 1			; CHECK-NEXT: store i8 0, i8* [[CALL]], align 1
	; CHECK-NEXT: ret i8* [[CALL]]			; CHECK-NEXT: ret i8* [[CALL]]
	;			;
	%call = tail call i8* @calloc(i64 1, i64 10) inaccessiblememonly			%call = tail call i8* @calloc(i64 1, i64 10) inaccessiblememonly
	▲ Show 20 Lines • Show All 126 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: call void @memset_pattern16(i8* [[CALL]], i8* [[PAT:%.*]], i64 40000)			; CHECK-NEXT: call void @memset_pattern16(i8* [[CALL]], i8* [[PAT:%.*]], i64 40000)
	; CHECK-NEXT: ret i8* [[CALL]]			; CHECK-NEXT: ret i8* [[CALL]]
	;			;
	%call = tail call i8* @calloc(i64 10000, i64 4) #1			%call = tail call i8* @calloc(i64 10000, i64 4) #1
	call void @llvm.memset.p0i8.i64(i8* align 4 %call, i8 0, i64 40000, i1 false)			call void @llvm.memset.p0i8.i64(i8* align 4 %call, i8 0, i64 40000, i1 false)
	call void @memset_pattern16(i8* %call, i8* %pat, i64 40000) #1			call void @memset_pattern16(i8* %call, i8* %pat, i64 40000) #1
	ret i8* %call			ret i8* %call
	}			}

				@n = global i32 0, align 4
				@a = external global i32, align 4
				@b = external global i32*, align 8

				; GCC calloc-1.c test case should create calloc
				; The malloc result is compared against null at the end of the entry block
				; and the memset of the same size sits in the non-null successor, with
				; unrelated loads/stores around it. The expectations below require the
				; malloc to become calloc(1, n) and the memset to disappear, while the
				; other stores are kept.
				define i8* @test_malloc_memset_to_calloc(i64* %0) {
				; CHECK-LABEL: @test_malloc_memset_to_calloc(
				; CHECK: entry:
				; CHECK-NEXT: [[TMP1:%.*]] = load i32, i32* @n, align 4
				; CHECK-NEXT: [[TMP2:%.*]] = sext i32 [[TMP1]] to i64
				; CHECK-NEXT: [[CALLOC:%.*]] = call i8* @calloc(i64 1, i64 [[TMP2]])
				; CHECK-NEXT: [[TMP3:%.*]] = load i64, i64* [[TMP0:%.*]], align 8
				; CHECK-NEXT: [[TMP4:%.*]] = add nsw i64 [[TMP3]], 1
				; CHECK-NEXT: store i64 [[TMP4]], i64* [[TMP0]], align 8
				; CHECK-NEXT: [[TMP5:%.*]] = icmp eq i8* [[CALLOC]], null
				; CHECK-NEXT: br i1 [[TMP5]], label [[IF_END:%.*]], label [[IF_THEN:%.*]]
				; CHECK: if.then: ; preds = %entry
				; CHECK-NEXT: [[TMP6:%.*]] = add nsw i64 [[TMP3]], 2
				; CHECK-NEXT: store i64 [[TMP6]], i64* [[TMP0]], align 8
				; CHECK-NEXT: store i32 2, i32* @a, align 4
				; CHECK-NEXT: [[TMP7:%.*]] = load i32*, i32** @b, align 8
				; CHECK-NEXT: store i32 3, i32* [[TMP7]], align 4
				; CHECK-NEXT: br label [[IF_END]]
				; CHECK: if.end: ; preds = %if.then, %entry
				; CHECK-NEXT: ret i8* [[CALLOC]]
				;
				entry:
				%1 = load i32, i32* @n, align 4
				%2 = sext i32 %1 to i64
				%3 = tail call i8* @malloc(i64 %2) inaccessiblememonly
				%4 = load i64, i64* %0, align 8
				%5 = add nsw i64 %4, 1
				store i64 %5, i64* %0, align 8
				%6 = icmp eq i8* %3, null
				br i1 %6, label %if.end, label %if.then

				if.then:
				%7 = add nsw i64 %4, 2
				store i64 %7, i64* %0, align 8
				store i32 2, i32* @a, align 4
				tail call void @llvm.memset.p0i8.i64(i8* align 4 %3, i8 0, i64 %2, i1 false)
				; @b is a global holding an i32*, so the load yields the pointer that
				; the following store writes through.
				%8 = load i32*, i32** @b, align 8
				store i32 3, i32* %8, align 4
				br label %if.end

				if.end:
				ret i8* %3
				}

This is an archive of the discontinued LLVM Phabricator instance.

[DSE] Re-enable calloc transformation with extra care (PR25892)
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 378529

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

llvm/test/Transforms/DeadStoreElimination/noop-stores.ll

This is an archive of the discontinued LLVM Phabricator instance.

[DSE] Re-enable calloc transformation with extra care (PR25892)ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 378529

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

llvm/test/Transforms/DeadStoreElimination/noop-stores.ll

[DSE] Re-enable calloc transformation with extra care (PR25892)
ClosedPublic