Diff 373613

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

//===- DeadStoreElimination.cpp - MemorySSA Backed Dead Store Elimination -===//		//===- DeadStoreElimination.cpp - MemorySSA Backed Dead Store Elimination -===//
		Lint: clang-format suggested style edits found.
//		//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.		// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//		//
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
//		//
// The code below implements dead store elimination using MemorySSA. It uses		// The code below implements dead store elimination using MemorySSA. It uses
▲ Show 20 Lines • Show All 858 Lines • ▼ Show 20 Lines	static PhiTransPtr phiTranslatePtr(const PhiTransPtr &Ptr, BasicBlock *FromBB,
}		}

WorkList.push_back({FromBB, Ptr});		WorkList.push_back({FromBB, Ptr});

while (!WorkList.empty()) {		while (!WorkList.empty()) {
auto CurrNode = WorkList.pop_back_val();		auto CurrNode = WorkList.pop_back_val();
BasicBlock *CurrBB = CurrNode.first;		BasicBlock *CurrBB = CurrNode.first;
const PhiTransPtr &CurrPtr = CurrNode.second;		const PhiTransPtr &CurrPtr = CurrNode.second;
		int64_t Offset = 0;
		Value *const BasePtr =
		GetPointerBaseWithConstantOffset(CurrPtr.first, Offset, DL);
		const int64_t BaseOffset = CurrPtr.second + Offset;

for (pred_iterator PI = pred_begin(CurrBB), E = pred_end(CurrBB); PI != E;		for (pred_iterator PI = pred_begin(CurrBB), E = pred_end(CurrBB); PI != E;
++PI) {		++PI) {
BasicBlock PredBB = PI;		BasicBlock PredBB = PI;
PHITransAddr TransAddr{CurrPtr.first, DL, AC};		PHITransAddr TransAddr{BasePtr, DL, AC};

// TODO:		// TODO:
if (!DT.dominates(ToBB, PredBB))		if (!DT.dominates(ToBB, PredBB))
continue;		continue;

if (TransAddr.NeedsPHITranslationFromBlock(CurrBB) &&		if (TransAddr.NeedsPHITranslationFromBlock(CurrBB) &&
(!TransAddr.IsPotentiallyPHITranslatable() \|\|		(!TransAddr.IsPotentiallyPHITranslatable() \|\|
TransAddr.PHITranslateValue(CurrBB, PredBB, &DT, false)))		TransAddr.PHITranslateValue(CurrBB, PredBB, &DT, false)))
return PhiTransPtr{};		return PhiTransPtr{};

auto Inserted =		auto Inserted =
Visited.try_emplace(PredBB, TransAddr.getAddr(), CurrPtr.second);		Visited.try_emplace(PredBB, TransAddr.getAddr(), BaseOffset);
auto &TransPtr = Inserted.first->second;		auto &TransPtr = Inserted.first->second;
if (!Inserted.second) {		if (!Inserted.second) {
if (TransAddr.getAddr() != TransPtr.first \|\|		if (TransAddr.getAddr() != TransPtr.first \|\|
CurrPtr.second != TransPtr.second)		BaseOffset != TransPtr.second)
// We already visited this block before. If it was with a different		// We already visited this block before. If it was with a different
// address - bail out!		// address - bail out!
return PhiTransPtr{};		return PhiTransPtr{};
continue;		continue;
}		}

if (PredBB == ToBB) {		if (PredBB == ToBB) {
ResPtr = TransPtr;		ResPtr = TransPtr;
continue;		continue;
}		}

WorkList.push_back({PredBB, TransPtr});		WorkList.push_back({PredBB, TransPtr});
}		}
}		}

assert(ResPtr.first.pointsToAliveValue() &&		assert(ResPtr.first.pointsToAliveValue() &&
"PHI translation is expected to complete successfully");		"PHI translation is expected to complete successfully");
assert(ResPtr.second == 0 &&
"Unexpected non-zero offset during phi translation");
return ResPtr;		return ResPtr;
}		}

static ExMemoryAccess		static ExMemoryAccess
phiTransFromMemoryAccessTo(const ExMemoryAccess &FromAccess,		phiTransFromMemoryAccessTo(const ExMemoryAccess &FromAccess,
MemoryAccess *ToAccess, const DataLayout &DL,		MemoryAccess *ToAccess, const DataLayout &DL,
DominatorTree &DT, AssumptionCache *AC) {		DominatorTree &DT, AssumptionCache *AC) {
PhiTransPtr ResAddr;		PhiTransPtr ResAddr;
▲ Show 20 Lines • Show All 110 Lines • ▼ Show 20 Lines	struct DSEState {

/// Return 'OW_Complete' if a store to the 'KillingLoc' location (by \p		/// Return 'OW_Complete' if a store to the 'KillingLoc' location (by \p
/// KillingI instruction) completely overwrites a store to the 'DeadLoc'		/// KillingI instruction) completely overwrites a store to the 'DeadLoc'
/// location (by \p DeadI instruction).		/// location (by \p DeadI instruction).
/// Return OW_MaybePartial if \p KillingI does not completely overwrite		/// Return OW_MaybePartial if \p KillingI does not completely overwrite
/// \p DeadI, but they both write to the same underlying object. In that		/// \p DeadI, but they both write to the same underlying object. In that
/// case, use isPartialOverwrite to check if \p KillingI partially overwrites		/// case, use isPartialOverwrite to check if \p KillingI partially overwrites
/// \p DeadI. Returns 'OW_Unknown' if nothing can be determined.		/// \p DeadI. Returns 'OW_Unknown' if nothing can be determined.
		/// Parameters:
		/// KillingI/DeadI - Instructions accessing \p KillingLoc/DeadLoc memory
		/// locations
		/// KillingLoc/DeadLoc - Memory locations under question
		/// KillingOff/DeadOff [in, out] - On input, may provide initial offset of
		/// access relative to KillingLoc/DeadLoc memory location. On output, if
		/// returned value is not "OW_Unknown" will keep absolute offset of access
		/// relative to some common base of KillingLoc and DeadLoc locations.
OverwriteResult isOverwrite(const Instruction *KillingI,		OverwriteResult isOverwrite(const Instruction *KillingI,
const Instruction *DeadI,		const Instruction *DeadI,
const MemoryLocation &KillingLoc,		const MemoryLocation &KillingLoc,
const MemoryLocation &DeadLoc,		const MemoryLocation &DeadLoc,
int64_t &KillingOff, int64_t &DeadOff) {		int64_t &KillingOff, int64_t &DeadOff) {
// AliasAnalysis does not always account for loops. Limit overwrite checks		// AliasAnalysis does not always account for loops. Limit overwrite checks
// to dependencies for which we can guarantee they are independent of any		// to dependencies for which we can guarantee they are independent of any
// loops they are in.		// loops they are in.
if (!isGuaranteedLoopIndependent(DeadI, KillingI, DeadLoc))		if (!isGuaranteedLoopIndependent(DeadI, KillingI, DeadLoc))
return OW_Unknown;		return OW_Unknown;

// FIXME: Vet that this works for size upper-bounds. Seems unlikely that we'll		// FIXME: Vet that this works for size upper-bounds. Seems unlikely that we'll
// get imprecise values here, though (except for unknown sizes).		// get imprecise values here, though (except for unknown sizes).
if (!KillingLoc.Size.isPrecise() \|\| !DeadLoc.Size.isPrecise()) {		if (!KillingLoc.Size.isPrecise() \|\| !DeadLoc.Size.isPrecise()) {
// In case no constant size is known, try to find IR values for the number		// In case no constant size is known, try to find IR values for the number
// of bytes written and check if they match.		// of bytes written and check if they match.
const auto *KillingMemI = dyn_cast<MemIntrinsic>(KillingI);		const auto *KillingMemI = dyn_cast<MemIntrinsic>(KillingI);
const auto *DeadMemI = dyn_cast<MemIntrinsic>(DeadI);		const auto *DeadMemI = dyn_cast<MemIntrinsic>(DeadI);
if (KillingMemI && DeadMemI) {		if (KillingMemI && DeadMemI) {
const Value *KillingV = KillingMemI->getLength();		const Value *KillingV = KillingMemI->getLength();
const Value *DeadV = DeadMemI->getLength();		const Value *DeadV = DeadMemI->getLength();
if (KillingV == DeadV && BatchAA.isMustAlias(DeadLoc, KillingLoc))		if (KillingV == DeadV && KillingOff == DeadOff &&
		BatchAA.isMustAlias(DeadLoc, KillingLoc))
return OW_Complete;		return OW_Complete;
}		}

// Masked stores have imprecise locations, but we can reason about them		// Masked stores have imprecise locations, but we can reason about them
// to some extent.		// to some extent.
return isMaskedStoreOverwrite(KillingI, DeadI, BatchAA);		return isMaskedStoreOverwrite(KillingI, DeadI, BatchAA);
}		}

const uint64_t KillingSize = KillingLoc.Size.getValue();		const uint64_t KillingSize = KillingLoc.Size.getValue();
const uint64_t DeadSize = DeadLoc.Size.getValue();		const uint64_t DeadSize = DeadLoc.Size.getValue();

// Query the alias information		// Query the alias information
AliasResult AAR = BatchAA.alias(KillingLoc, DeadLoc);		AliasResult AAR = BatchAA.alias(KillingLoc, DeadLoc);

// If the start pointers are the same, we just have to compare sizes to see if		// If the start pointers are the same, it's enough to compare sizes and
		fhahn (inline comment, unsubmitted, not done): This comment needs updating; the `if` below now handles both the must-alias and the partial-alias cases. The logic might be easier to follow and document if the must-alias and partial-alias logic were kept separate, at the cost of minor code duplication.
// the killing store was larger than the dead store.		// offsets to see if the killing store fully overwrites the dead one.
if (AAR == AliasResult::MustAlias) {		if (AAR == AliasResult::MustAlias \|\|
// Make sure that the KillingSize size is >= the DeadSize size.		(AAR == AliasResult::PartialAlias && AAR.hasOffset() &&
if (KillingSize >= DeadSize)		AAR.getOffset() >= 0)) {
		int64_t AdjEarlierOff =
		DeadOff + (AAR == AliasResult::PartialAlias ? AAR.getOffset() : 0);
		// Make sure that the dead access is "inside" the killing one.
		if (AdjEarlierOff >= KillingOff &&
		uint64_t(AdjEarlierOff - KillingOff) + DeadSize <= KillingSize) {
		DeadOff = AdjEarlierOff;
return OW_Complete;		return OW_Complete;
}		}

// If we hit a partial alias we may have a full overwrite
if (AAR == AliasResult::PartialAlias && AAR.hasOffset()) {
int32_t Off = AAR.getOffset();
if (Off >= 0 && (uint64_t)Off + DeadSize <= KillingSize)
return OW_Complete;
}		}

// Check to see if the killing store is to the entire object (either a		// Check to see if the killing store is to the entire object (either a
// global, an alloca, or a byval/inalloca argument). If so, then it clearly		// global, an alloca, or a byval/inalloca argument). If so, then it clearly
// overwrites any other store to the same object.		// overwrites any other store to the same object.
const Value *DeadPtr = DeadLoc.Ptr->stripPointerCasts();		const Value *DeadPtr = DeadLoc.Ptr->stripPointerCasts();
const Value *KillingPtr = KillingLoc.Ptr->stripPointerCasts();		const Value *KillingPtr = KillingLoc.Ptr->stripPointerCasts();
const Value *DeadUndObj = getUnderlyingObject(DeadPtr);		const Value *DeadUndObj = getUnderlyingObject(DeadPtr);
const Value *KillingUndObj = getUnderlyingObject(KillingPtr);		const Value *KillingUndObj = getUnderlyingObject(KillingPtr);

// If we can't resolve the same pointers to the same object, then we can't		// If we can't resolve the same pointers to the same object, then we can't
// analyze them at all.		// analyze them at all.
if (DeadUndObj != KillingUndObj)		if (DeadUndObj != KillingUndObj)
return OW_Unknown;		return OW_Unknown;

// If the KillingI store is to a recognizable object, get its size.		// If the KillingI store is to a recognizable object, get its size.
uint64_t KillingUndObjSize = getPointerSize(KillingUndObj, DL, TLI, &F);		uint64_t KillingUndObjSize = getPointerSize(KillingUndObj, DL, TLI, &F);
if (KillingUndObjSize != MemoryLocation::UnknownSize)		if (KillingUndObjSize != MemoryLocation::UnknownSize)
if (KillingUndObjSize == KillingSize && KillingUndObjSize >= DeadSize)		if (KillingUndObjSize == KillingSize && KillingUndObjSize >= DeadSize)
return OW_Complete;		return OW_Complete;

// Okay, we have stores to two completely different pointers. Try to		// Okay, we have stores to two completely different pointers. Try to
// decompose the pointer into a "base + constant_offset" form. If the base		// decompose the pointer into a "base + constant_offset" form. If the
// pointers are equal, then we can reason about the two stores.		// base pointers are equal, then we can reason about the two stores.
DeadOff = 0;		int64_t ExtraDeadOff = 0;
KillingOff = 0;		int64_t ExtraKillingOff = 0;
const Value *DeadBasePtr =		const Value *DeadBasePtr =
GetPointerBaseWithConstantOffset(DeadPtr, DeadOff, DL);		GetPointerBaseWithConstantOffset(DeadPtr, ExtraDeadOff, DL);
const Value *KillingBasePtr =		const Value *KillingBasePtr =
GetPointerBaseWithConstantOffset(KillingPtr, KillingOff, DL);		GetPointerBaseWithConstantOffset(KillingPtr, ExtraKillingOff, DL);
		DeadOff += ExtraDeadOff;
		KillingOff += ExtraKillingOff;

// If the base pointers still differ, we have two completely different		// If the base pointers still differ, we have two completely different
// stores.		// stores.
if (DeadBasePtr != KillingBasePtr)		if (DeadBasePtr != KillingBasePtr)
return OW_Unknown;		return OW_Unknown;

// The killing access completely overlaps the dead store if and only if		// The killing access completely overlaps the dead store if and only if
// both start and end of the dead one is "inside" the killing one:		// both start and end of the dead one is "inside" the killing one:
▲ Show 20 Lines • Show All 111 Lines • ▼ Show 20 Lines	bool isCompleteOverwrite(const MemoryLocation &DefLoc, Instruction *DefInst,
// MemoryDef.		// MemoryDef.
if (!UseInst->mayWriteToMemory())		if (!UseInst->mayWriteToMemory())
return false;		return false;

if (auto *CB = dyn_cast<CallBase>(UseInst))		if (auto *CB = dyn_cast<CallBase>(UseInst))
if (CB->onlyAccessesInaccessibleMemory())		if (CB->onlyAccessesInaccessibleMemory())
return false;		return false;

int64_t InstWriteOffset, DepWriteOffset;		int64_t InstWriteOffset = 0;
		int64_t DepWriteOffset = 0;
if (auto CC = getLocForWriteEx(UseInst))		if (auto CC = getLocForWriteEx(UseInst))
return isOverwrite(UseInst, DefInst, *CC, DefLoc, InstWriteOffset,		return isOverwrite(UseInst, DefInst, *CC, DefLoc, InstWriteOffset,
DepWriteOffset) == OW_Complete;		DepWriteOffset) == OW_Complete;
return false;		return false;
}		}

/// Returns true if \p Def is not read before returning from the function.		/// Returns true if \p Def is not read before returning from the function.
bool isWriteAtEndOfFunction(MemoryDef *Def) {		bool isWriteAtEndOfFunction(MemoryDef *Def) {
▲ Show 20 Lines • Show All 317 Lines • ▼ Show 20 Lines	for (;;
continue;		continue;
} else {		} else {
auto &KillingMemLoc = PhiTransKillingLocAndOffset		auto &KillingMemLoc = PhiTransKillingLocAndOffset
? (*PhiTransKillingLocAndOffset).first		? (*PhiTransKillingLocAndOffset).first
: KillingLoc;		: KillingLoc;
int64_t KillingMemOffset = PhiTransKillingLocAndOffset		int64_t KillingMemOffset = PhiTransKillingLocAndOffset
? (*PhiTransKillingLocAndOffset).second		? (*PhiTransKillingLocAndOffset).second
: 0;		: 0;
assert(KillingMemOffset == 0 && "Unexpected non-zero offset");
auto OR = isOverwrite(KillingI, CurrentI, KillingMemLoc, *CurrentLoc,		auto OR = isOverwrite(KillingI, CurrentI, KillingMemLoc, *CurrentLoc,
KillingMemOffset, CurrOffset);		KillingMemOffset, CurrOffset);
// If Current does not write to the same object as KillingDef, check		// If Current does not write to the same object as KillingDef, check
// the next candidate.		// the next candidate.
if (OR == OW_Unknown)		if (OR == OW_Unknown)
continue;		continue;
else if (OR == OW_MaybePartial) {		else if (OR == OW_MaybePartial) {
// If KillingDef only partially overwrites Current, check the next		// If KillingDef only partially overwrites Current, check the next
▲ Show 20 Lines • Show All 560 Lines • ▼ Show 20 Lines	while (!ToCheck.empty()) {
int64_t KillingOffset = 0;		int64_t KillingOffset = 0;
int64_t DeadOffset = 0;		int64_t DeadOffset = 0;

if (ExDeadAccess.second.first.pointsToAliveValue()) {		if (ExDeadAccess.second.first.pointsToAliveValue()) {
KillingLoc = KillingLoc.getWithNewPtr(ExDeadAccess.second.first)		KillingLoc = KillingLoc.getWithNewPtr(ExDeadAccess.second.first)
.getWithoutAATags();		.getWithoutAATags();
KillingOffset = ExDeadAccess.second.second;		KillingOffset = ExDeadAccess.second.second;
}		}
assert(KillingOffset == 0 && "Unexpected non-zero offset");

OverwriteResult OR = State.isOverwrite(		OverwriteResult OR = State.isOverwrite(
KillingI, DeadI, KillingLoc, DeadLoc, KillingOffset, DeadOffset);		KillingI, DeadI, KillingLoc, DeadLoc, KillingOffset, DeadOffset);
if (OR == OW_MaybePartial) {		if (OR == OW_MaybePartial) {
auto Iter = State.IOLs.insert(		auto Iter = State.IOLs.insert(
std::make_pair<BasicBlock *, InstOverlapIntervalsTy>(		std::make_pair<BasicBlock *, InstOverlapIntervalsTy>(
DeadI->getParent(), InstOverlapIntervalsTy()));		DeadI->getParent(), InstOverlapIntervalsTy()));
auto &IOL = Iter.first->second;		auto &IOL = Iter.first->second;
▲ Show 20 Lines • Show All 168 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[DSE][WIP] Enable PHI translation to work through GEPs
Needs Review · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 373613

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[DSE][WIP] Enable PHI translation to work through GEPs
Needs Review · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 373613

llvm/lib/Transforms/Scalar/DeadStoreElimination.cpp

[DSE][WIP] Enable PHI translation to work through GEPs
Needs Review · Public