Diff 440218

llvm/include/llvm/Transforms/Scalar/GVN.h

Show All 29 Lines
#include <vector>		#include <vector>

namespace llvm {		namespace llvm {

class AAResults;		class AAResults;
class AssumeInst;		class AssumeInst;
class AssumptionCache;		class AssumptionCache;
class BasicBlock;		class BasicBlock;
		class BatchAAResults;
class BranchInst;		class BranchInst;
class CallInst;		class CallInst;
class ExtractValueInst;		class ExtractValueInst;
class Function;		class Function;
class FunctionPass;		class FunctionPass;
class GetElementPtrInst;		class GetElementPtrInst;
class ImplicitControlFlowTracking;		class ImplicitControlFlowTracking;
class LoadInst;		class LoadInst;
class LoopInfo;		class LoopInfo;
class MemDepResult;		class MemDepResult;
		class MemoryAccess;
class MemoryDependenceResults;		class MemoryDependenceResults;
		class MemoryLocation;
class MemorySSA;		class MemorySSA;
class MemorySSAUpdater;		class MemorySSAUpdater;
class NonLocalDepResult;		class NonLocalDepResult;
class OptimizationRemarkEmitter;		class OptimizationRemarkEmitter;
class PHINode;		class PHINode;
class TargetLibraryInfo;		class TargetLibraryInfo;
class Value;		class Value;
/// A private "module" namespace for types and utilities used by GVN. These		/// A private "module" namespace for types and utilities used by GVN. These
▲ Show 20 Lines • Show All 148 Lines • ▼ Show 20 Lines	public:

public:		public:
ValueTable();		ValueTable();
ValueTable(const ValueTable &Arg);		ValueTable(const ValueTable &Arg);
ValueTable(ValueTable &&Arg);		ValueTable(ValueTable &&Arg);
~ValueTable();		~ValueTable();
ValueTable &operator=(const ValueTable &Arg);		ValueTable &operator=(const ValueTable &Arg);

		uint32_t lookupOrAdd(MemoryAccess *);
uint32_t lookupOrAdd(Value *V);		uint32_t lookupOrAdd(Value *V);
uint32_t lookup(Value *V, bool Verify = true) const;		uint32_t lookup(Value *V, bool Verify = true) const;
uint32_t lookupOrAddCmp(unsigned Opcode, CmpInst::Predicate Pred,		uint32_t lookupOrAddCmp(unsigned Opcode, CmpInst::Predicate Pred,
Value LHS, Value RHS);		Value LHS, Value RHS);
uint32_t phiTranslate(const BasicBlock BB, const BasicBlock PhiBlock,		uint32_t phiTranslate(const BasicBlock BB, const BasicBlock PhiBlock,
uint32_t Num, GVNPass &Gvn);		uint32_t Num, GVNPass &Gvn);
void eraseTranslateCacheEntry(uint32_t Num, const BasicBlock &CurrBlock);		void eraseTranslateCacheEntry(uint32_t Num, const BasicBlock &CurrBlock);
bool exists(Value *V) const;		bool exists(Value *V) const;
Show All 16 Lines	private:
MemoryDependenceResults *MD = nullptr;		MemoryDependenceResults *MD = nullptr;
DominatorTree *DT = nullptr;		DominatorTree *DT = nullptr;
const TargetLibraryInfo *TLI = nullptr;		const TargetLibraryInfo *TLI = nullptr;
AssumptionCache *AC = nullptr;		AssumptionCache *AC = nullptr;
SetVector<BasicBlock *> DeadBlocks;		SetVector<BasicBlock *> DeadBlocks;
OptimizationRemarkEmitter *ORE = nullptr;		OptimizationRemarkEmitter *ORE = nullptr;
ImplicitControlFlowTracking *ICF = nullptr;		ImplicitControlFlowTracking *ICF = nullptr;
LoopInfo *LI = nullptr;		LoopInfo *LI = nullptr;
		AAResults *AA = nullptr;
MemorySSAUpdater *MSSAU = nullptr;		MemorySSAUpdater *MSSAU = nullptr;

ValueTable VN;		ValueTable VN;

/// A mapping from value numbers to lists of Value*'s that		/// A mapping from value numbers to lists of Value*'s that
/// have that value number. Use findLeader to query it.		/// have that value number. Use findLeader to query it.
struct LeaderTableEntry {		struct LeaderTableEntry {
Value *Val;		Value *Val;
▲ Show 20 Lines • Show All 70 Lines • ▼ Show 20 Lines	if (Prev) {
Curr->Next = Next->Next;		Curr->Next = Next->Next;
}		}
}		}
}		}

// List of critical edges to be split between iterations.		// List of critical edges to be split between iterations.
SmallVector<std::pair<Instruction *, unsigned>, 4> toSplit;		SmallVector<std::pair<Instruction *, unsigned>, 4> toSplit;

		enum class DepKind {
		Other = 0, // Unknown value
		Def, // Exactly overlapping locations.
		Clobber, // Reaching value superset of needed bits.
		};

		struct ReachingMemVal {
		DepKind Kind;
		BasicBlock *Block;
		const Value *Addr;
		Instruction *Inst;
		int32_t Offset;

		static ReachingMemVal getUnknown(BasicBlock BB, const Value Addr,
		Instruction *Inst = nullptr) {
		return {DepKind::Other, BB, Addr, Inst, -1};
		}

		static ReachingMemVal getDef(const Value Addr, Instruction Inst) {
		return {DepKind::Def, Inst->getParent(), Addr, Inst, -1};
		}

		static ReachingMemVal getClobber(const Value Addr, Instruction Inst,
		int32_t Offset = -1) {
		return {DepKind::Clobber, Inst->getParent(), Addr, Inst, Offset};
		}
		};

		Optional<ReachingMemVal> findReachingValueForLoadInBlock(
		const MemoryLocation &Loc, bool IsInvariantload, BasicBlock *BB,
		Instruction DomLower, Instruction DomUpper, MemoryAccess *ClobberMA,
		MemorySSA &MSSA, BatchAAResults &AA);

		bool findReachingValuesForLoad(LoadInst *Inst, MemorySSA &MSSA, AAResults &AA,
		SmallVectorImpl<ReachingMemVal> &Values);

// Helper functions of redundant load elimination		// Helper functions of redundant load elimination
bool processLoad(LoadInst *L);		bool processLoad(LoadInst *L);
bool processNonLocalLoad(LoadInst *L);		bool processNonLocalLoad(LoadInst *L);
		bool processNonLocalLoad(LoadInst *L, SmallVectorImpl<ReachingMemVal> &Deps);
bool processAssumeIntrinsic(AssumeInst *II);		bool processAssumeIntrinsic(AssumeInst *II);

/// Given a local dependency (Def or Clobber) determine if a value is		/// Given a local dependency (Def or Clobber) determine if a value is
/// available for the load. Returns true if a value is known to be		/// available for the load. Returns true if a value is known to be
/// available and populates Res. Returns false otherwise.		/// available and populates Res. Returns false otherwise.
bool AnalyzeLoadAvailability(LoadInst *Load, MemDepResult DepInfo,		bool AnalyzeLoadAvailability(LoadInst *Load, const ReachingMemVal &Dep,
Value *Address, gvn::AvailableValue &Res);		Value *Address, gvn::AvailableValue &Res);

/// Given a list of non-local dependencies, determine if a value is		/// Given a list of non-local dependencies, determine if a value is
/// available for the load in each specified block. If it is, add it to		/// available for the load in each specified block. If it is, add it to
/// ValuesPerBlock. If not, add it to UnavailableBlocks.		/// ValuesPerBlock. If not, add it to UnavailableBlocks.
void AnalyzeLoadAvailability(LoadInst *Load, LoadDepVect &Deps,		void AnalyzeLoadAvailability(LoadInst *Load,
		SmallVectorImpl<ReachingMemVal> &Deps,
AvailValInBlkVect &ValuesPerBlock,		AvailValInBlkVect &ValuesPerBlock,
UnavailBlkVect &UnavailableBlocks);		UnavailBlkVect &UnavailableBlocks);

bool PerformLoadPRE(LoadInst *Load, AvailValInBlkVect &ValuesPerBlock,		bool PerformLoadPRE(LoadInst *Load, AvailValInBlkVect &ValuesPerBlock,
UnavailBlkVect &UnavailableBlocks);		UnavailBlkVect &UnavailableBlocks);

/// Try to replace a load which executes on each loop iteration with Phi		/// Try to replace a load which executes on each loop iteration with Phi
/// translation of load in preheader and load(s) in conditionally executed		/// translation of load in preheader and load(s) in conditionally executed
▲ Show 20 Lines • Show All 53 Lines • Show Last 20 Lines

llvm/lib/Transforms/Scalar/GVN.cpp

Show First 20 Lines • Show All 105 Lines • ▼ Show 20 Lines
static cl::opt<bool> GVNEnableLoadInLoopPRE("enable-load-in-loop-pre",		static cl::opt<bool> GVNEnableLoadInLoopPRE("enable-load-in-loop-pre",
cl::init(true));		cl::init(true));
static cl::opt<bool>		static cl::opt<bool>
GVNEnableSplitBackedgeInLoadPRE("enable-split-backedge-in-load-pre",		GVNEnableSplitBackedgeInLoadPRE("enable-split-backedge-in-load-pre",
cl::init(false));		cl::init(false));
static cl::opt<bool> GVNEnableMemDep("enable-gvn-memdep", cl::init(true));		static cl::opt<bool> GVNEnableMemDep("enable-gvn-memdep", cl::init(true));
static cl::opt<bool> GVNEnableMemorySSA("enable-gvn-memoryssa", cl::init(false));		static cl::opt<bool> GVNEnableMemorySSA("enable-gvn-memoryssa", cl::init(false));

		static cl::opt<unsigned> BlockScanLimit(
		"gvn-block-scan-limit", cl::Hidden, cl::init(100),
		cl::desc("The number of memory accesses to scan in a block in reaching "
		"memory values analysis (default = 100)"));

static cl::opt<uint32_t> MaxNumDeps(		static cl::opt<uint32_t> MaxNumDeps(
"gvn-max-num-deps", cl::Hidden, cl::init(100),		"gvn-max-num-deps", cl::Hidden, cl::init(100),
cl::desc("Max number of dependences to attempt Load PRE (default = 100)"));		cl::desc("Max number of dependences to attempt Load PRE (default = 100)"));

// This is based on IsValueFullyAvailableInBlockNumSpeculationsMax stat.		// This is based on IsValueFullyAvailableInBlockNumSpeculationsMax stat.
static cl::opt<uint32_t> MaxBBSpeculations(		static cl::opt<uint32_t> MaxBBSpeculations(
"gvn-max-block-speculations", cl::Hidden, cl::init(600),		"gvn-max-block-speculations", cl::Hidden, cl::init(600),
cl::desc("Max number of blocks we're willing to speculate on (and recurse "		cl::desc("Max number of blocks we're willing to speculate on (and recurse "
▲ Show 20 Lines • Show All 354 Lines • ▼ Show 20 Lines
// * a MemoryPhi, add the value number of the basic block,		// * a MemoryPhi, add the value number of the basic block,
// corresponding to that MemoryPhi		// corresponding to that MemoryPhi
// * a MemoryDef, add the value number of the memory setting		// * a MemoryDef, add the value number of the memory setting
// instruction.		// instruction.
void GVNPass::ValueTable::addMemoryStateArg(Instruction *I, Expression &E) {		void GVNPass::ValueTable::addMemoryStateArg(Instruction *I, Expression &E) {
assert(MSSA && "Function should not be called without MemorySSA");		assert(MSSA && "Function should not be called without MemorySSA");
assert(MSSA->getMemoryAccess(I) && "Instruction does not access memory");		assert(MSSA->getMemoryAccess(I) && "Instruction does not access memory");
MemoryAccess *MA = MSSA->getSkipSelfWalker()->getClobberingMemoryAccess(I);		MemoryAccess *MA = MSSA->getSkipSelfWalker()->getClobberingMemoryAccess(I);
		E.varargs.push_back(lookupOrAdd(MA));
uint32_t N = 0;
if (isa<MemoryPhi>(MA))
N = lookupOrAdd(MA->getBlock());
else if (MSSA->isLiveOnEntryDef(MA))
N = lookupOrAdd(&I->getFunction()->getEntryBlock());
else
N = lookupOrAdd(cast<MemoryDef>(MA)->getMemoryInst());
E.varargs.push_back(N);
}		}

uint32_t GVNPass::ValueTable::lookupOrAddCall(CallInst *C) {		uint32_t GVNPass::ValueTable::lookupOrAddCall(CallInst *C) {
if (AA->doesNotAccessMemory(C)) {		if (AA->doesNotAccessMemory(C)) {
Expression exp = createCallExpr(C);		Expression exp = createCallExpr(C);
uint32_t e = assignExpNewValueNum(exp).first;		uint32_t e = assignExpNewValueNum(exp).first;
valueNumbering[C] = e;		valueNumbering[C] = e;
return e;		return e;
▲ Show 20 Lines • Show All 126 Lines • ▼ Show 20 Lines	uint32_t GVNPass::ValueTable::lookupOrAddLoadStore(Instruction *I) {
return N;		return N;
}		}

/// Returns true if a value number exists for the specified value.		/// Returns true if a value number exists for the specified value.
bool GVNPass::ValueTable::exists(Value *V) const {		bool GVNPass::ValueTable::exists(Value *V) const {
return valueNumbering.count(V) != 0;		return valueNumbering.count(V) != 0;
}		}

		uint32_t GVNPass::ValueTable::lookupOrAdd(MemoryAccess *MA) {
		return MSSA->isLiveOnEntryDef(MA) \|\| isa<MemoryPhi>(MA)
		? lookupOrAdd(MA->getBlock())
		: lookupOrAdd(cast<MemoryUseOrDef>(MA)->getMemoryInst());
		}

/// lookupOrAdd - Returns the value number for the specified value, assigning		/// lookupOrAdd - Returns the value number for the specified value, assigning
/// it a new number if it did not have one before.		/// it a new number if it did not have one before.
uint32_t GVNPass::ValueTable::lookupOrAdd(Value *V) {		uint32_t GVNPass::ValueTable::lookupOrAdd(Value *V) {
DenseMap<Value*, uint32_t>::iterator VI = valueNumbering.find(V);		DenseMap<Value*, uint32_t>::iterator VI = valueNumbering.find(V);
if (VI != valueNumbering.end())		if (VI != valueNumbering.end())
return VI->second;		return VI->second;

if (!isa<Instruction>(V)) {		if (!isa<Instruction>(V)) {
▲ Show 20 Lines • Show All 433 Lines • ▼ Show 20 Lines	if (CoercedLoad->getType() == LoadTy && Offset == 0) {
Res = CoercedLoad;		Res = CoercedLoad;
} else {		} else {
Res = getLoadValueForLoad(CoercedLoad, Offset, LoadTy, InsertPt, DL);		Res = getLoadValueForLoad(CoercedLoad, Offset, LoadTy, InsertPt, DL);
// We would like to use gvn.markInstructionForDeletion here, but we can't		// We would like to use gvn.markInstructionForDeletion here, but we can't
// because the load is already memoized into the leader map table that GVN		// because the load is already memoized into the leader map table that GVN
// tracks. It is potentially possible to remove the load from the table,		// tracks. It is potentially possible to remove the load from the table,
// but then all of the operations based on it would need to be		// but then all of the operations based on it would need to be
// rehashed. Just leave the dead load around.		// rehashed. Just leave the dead load around.
		if (gvn.isMemDepEnabled())
gvn.getMemDep().removeInstruction(CoercedLoad);		gvn.getMemDep().removeInstruction(CoercedLoad);
		[Inline review comment] chill (Author, Unsubmitted): Aha, segfault here, I guess.
LLVM_DEBUG(dbgs() << "GVN COERCED NONLOCAL LOAD:\nOffset: " << Offset		LLVM_DEBUG(dbgs() << "GVN COERCED NONLOCAL LOAD:\nOffset: " << Offset
<< " " << *getCoercedLoadValue() << '\n'		<< " " << *getCoercedLoadValue() << '\n'
<< *Res << '\n'		<< *Res << '\n'
<< "\n\n\n");		<< "\n\n\n");
}		}
} else if (isMemIntrinValue()) {		} else if (isMemIntrinValue()) {
Res = getMemInstValueForLoad(getMemIntrinValue(), Offset, LoadTy,		Res = getMemInstValueForLoad(getMemIntrinValue(), Offset, LoadTy,
InsertPt, DL);		InsertPt, DL);
Show All 33 Lines	if (From->getParent() == Between->getParent())
return DT->dominates(From, Between);		return DT->dominates(From, Between);
SmallSet<BasicBlock *, 1> Exclusion;		SmallSet<BasicBlock *, 1> Exclusion;
Exclusion.insert(Between->getParent());		Exclusion.insert(Between->getParent());
return !isPotentiallyReachable(From, To, &Exclusion, DT);		return !isPotentiallyReachable(From, To, &Exclusion, DT);
}		}

/// Try to locate the three instructions involved in a missed		/// Try to locate the three instructions involved in a missed
/// load-elimination case that is due to an intervening store.		/// load-elimination case that is due to an intervening store.
static void reportMayClobberedLoad(LoadInst *Load, MemDepResult DepInfo,		static void reportMayClobberedLoad(LoadInst Load, Instruction DepInst,
DominatorTree *DT,		DominatorTree *DT,
OptimizationRemarkEmitter *ORE) {		OptimizationRemarkEmitter *ORE) {
using namespace ore;		using namespace ore;

User *OtherAccess = nullptr;		User *OtherAccess = nullptr;

OptimizationRemarkMissed R(DEBUG_TYPE, "LoadClobbered", Load);		OptimizationRemarkMissed R(DEBUG_TYPE, "LoadClobbered", Load);
R << "load of type " << NV("Type", Load->getType()) << " not eliminated"		R << "load of type " << NV("Type", Load->getType()) << " not eliminated"
Show All 38 Lines	for (auto *U : Load->getPointerOperand()->users()) {
}		}
}		}
}		}
}		}

if (OtherAccess)		if (OtherAccess)
R << " in favor of " << NV("OtherAccess", OtherAccess);		R << " in favor of " << NV("OtherAccess", OtherAccess);

R << " because it is clobbered by " << NV("ClobberedBy", DepInfo.getInst());		R << " because it is clobbered by " << NV("ClobberedBy", DepInst);

ORE->emit(R);		ORE->emit(R);
}		}

/// Check if a load from pointer-select \p Address in \p DepBB can be converted		/// Check if a load from pointer-select \p Address in \p DepBB can be converted
/// to a value select. The following conditions need to be satisfied:		/// to a value select. The following conditions need to be satisfied:
/// 1. The pointer select (\p Address) must be defined in \p DepBB.		/// 1. The pointer select (\p Address) must be defined in \p DepBB.
/// 2. Both value operands of the pointer select must be loaded in the same		/// 2. Both value operands of the pointer select must be loaded in the same
Show All 23 Lines	if (any_of(make_range(EarlierLoad->getIterator(), End), [&](Instruction &I) {
return isModSet(AA->getModRefInfo(&I, L1Loc)) \|\|		return isModSet(AA->getModRefInfo(&I, L1Loc)) \|\|
isModSet(AA->getModRefInfo(&I, L2Loc));		isModSet(AA->getModRefInfo(&I, L2Loc));
}))		}))
return None;		return None;

return AvailableValue::getSelect(Sel);		return AvailableValue::getSelect(Sel);
}		}

bool GVNPass::AnalyzeLoadAvailability(LoadInst *Load, MemDepResult DepInfo,		bool GVNPass::AnalyzeLoadAvailability(LoadInst *Load, const ReachingMemVal &Dep,
Value *Address, AvailableValue &Res) {		Value *Address, AvailableValue &Res) {
if (!DepInfo.isDef() && !DepInfo.isClobber()) {		if (Dep.Kind == DepKind::Other) {
assert(isa<SelectInst>(Address));		assert(isa<SelectInst>(Address));
if (auto R = tryToConvertLoadOfPtrSelect(		if (auto R = tryToConvertLoadOfPtrSelect(
Load->getParent(), Load->getIterator(), Address, Load->getType(),		Load->getParent(), Load->getIterator(), Address, Load->getType(),
getDominatorTree(), getAliasAnalysis())) {		getDominatorTree(), getAliasAnalysis())) {
Res = *R;		Res = *R;
return true;		return true;
}		}
return false;		return false;
}		}

assert((DepInfo.isDef() \|\| DepInfo.isClobber()) &&		assert((Dep.Kind == DepKind::Def \|\| Dep.Kind == DepKind::Clobber) &&
"expected a local dependence");		"expected a local dependence");
assert(Load->isUnordered() && "rules below are incorrect for ordered access");		assert(Load->isUnordered() && "rules below are incorrect for ordered access");

const DataLayout &DL = Load->getModule()->getDataLayout();		const DataLayout &DL = Load->getModule()->getDataLayout();

Instruction *DepInst = DepInfo.getInst();		Instruction *DepInst = Dep.Inst;
if (DepInfo.isClobber()) {		if (Dep.Kind == DepKind::Clobber) {
// If the dependence is to a store that writes to a superset of the bits		// If the dependence is to a store that writes to a superset of the bits
// read by the load, we can extract the bits we need for the load from the		// read by the load, we can extract the bits we need for the load from the
// stored value.		// stored value.
if (StoreInst *DepSI = dyn_cast<StoreInst>(DepInst)) {		if (StoreInst *DepSI = dyn_cast<StoreInst>(DepInst)) {
// Can't forward from non-atomic to atomic without violating memory model.		// Can't forward from non-atomic to atomic without violating memory model.
if (Address && Load->isAtomic() <= DepSI->isAtomic()) {		if (Address && Load->isAtomic() <= DepSI->isAtomic()) {
int Offset =		int Offset =
analyzeLoadFromClobberingStore(Load->getType(), Address, DepSI, DL);		analyzeLoadFromClobberingStore(Load->getType(), Address, DepSI, DL);
Show All 10 Lines	if (Dep.Kind == DepKind::Clobber) {
// if we have this, replace the later with an extraction from the former.		// if we have this, replace the later with an extraction from the former.
if (LoadInst *DepLoad = dyn_cast<LoadInst>(DepInst)) {		if (LoadInst *DepLoad = dyn_cast<LoadInst>(DepInst)) {
// If this is a clobber and L is the first instruction in its block, then		// If this is a clobber and L is the first instruction in its block, then
// we have the first instruction in the entry block.		// we have the first instruction in the entry block.
// Can't forward from non-atomic to atomic without violating memory model.		// Can't forward from non-atomic to atomic without violating memory model.
if (DepLoad != Load && Address &&		if (DepLoad != Load && Address &&
Load->isAtomic() <= DepLoad->isAtomic()) {		Load->isAtomic() <= DepLoad->isAtomic()) {
Type *LoadType = Load->getType();		Type *LoadType = Load->getType();
int Offset = -1;		int Offset = Dep.Offset;
		if (MD && !MSSAU) {
// If MD reported clobber, check it was nested.		// If MD reported clobber, check it was nested.
if (DepInfo.isClobber() &&		if (canCoerceMustAliasedValueToLoad(DepLoad, LoadType, DL)) {
canCoerceMustAliasedValueToLoad(DepLoad, LoadType, DL)) {
const auto ClobberOff = MD->getClobberOffset(DepLoad);		const auto ClobberOff = MD->getClobberOffset(DepLoad);
// GVN cannot deal with a negative offset.		// GVN cannot deal with a negative offset.
Offset = (ClobberOff == None \|\| ClobberOff < 0) ? -1 : ClobberOff;		Offset = (ClobberOff == None \|\| ClobberOff < 0) ? -1 : ClobberOff;
}		}
		} else {
		if (!canCoerceMustAliasedValueToLoad(DepLoad, LoadType, DL) \|\|
		Offset < 0)
		Offset = -1;
		}
if (Offset == -1)		if (Offset == -1)
Offset =		Offset =
analyzeLoadFromClobberingLoad(LoadType, Address, DepLoad, DL);		analyzeLoadFromClobberingLoad(LoadType, Address, DepLoad, DL);
if (Offset != -1) {		if (Offset != -1) {
Res = AvailableValue::getLoad(DepLoad, Offset);		Res = AvailableValue::getLoad(DepLoad, Offset);
return true;		return true;
}		}
}		}
Show All 13 Lines	if (Dep.Kind == DepKind::Clobber) {
}		}

// Nothing known about this clobber, have to be conservative		// Nothing known about this clobber, have to be conservative
LLVM_DEBUG(		LLVM_DEBUG(
// fast print dep, using operator<< on instruction is too slow.		// fast print dep, using operator<< on instruction is too slow.
dbgs() << "GVN: load "; Load->printAsOperand(dbgs());		dbgs() << "GVN: load "; Load->printAsOperand(dbgs());
dbgs() << " is clobbered by " << *DepInst << '\n';);		dbgs() << " is clobbered by " << *DepInst << '\n';);
if (ORE->allowExtraAnalysis(DEBUG_TYPE))		if (ORE->allowExtraAnalysis(DEBUG_TYPE))
reportMayClobberedLoad(Load, DepInfo, DT, ORE);		reportMayClobberedLoad(Load, DepInst, DT, ORE);

return false;		return false;
}		}
assert(DepInfo.isDef() && "follows from above");		assert(Dep.Kind == DepKind::Def && "follows from above");

// Loading the alloca -> undef.		// Loading the alloca -> undef.
// Loading immediately after lifetime begin -> undef.		// Loading immediately after lifetime begin -> undef.
if (isa<AllocaInst>(DepInst) \|\| isLifetimeStart(DepInst)) {		if (isa<AllocaInst>(DepInst) \|\| isLifetimeStart(DepInst)) {
Res = AvailableValue::get(UndefValue::get(Load->getType()));		Res = AvailableValue::get(UndefValue::get(Load->getType()));
return true;		return true;
}		}

Show All 37 Lines	bool GVNPass::AnalyzeLoadAvailability(LoadInst *Load, const ReachingMemVal &Dep,
// Unknown def - must be conservative		// Unknown def - must be conservative
LLVM_DEBUG(		LLVM_DEBUG(
// fast print dep, using operator<< on instruction is too slow.		// fast print dep, using operator<< on instruction is too slow.
dbgs() << "GVN: load "; Load->printAsOperand(dbgs());		dbgs() << "GVN: load "; Load->printAsOperand(dbgs());
dbgs() << " has unknown def " << *DepInst << '\n';);		dbgs() << " has unknown def " << *DepInst << '\n';);
return false;		return false;
}		}

void GVNPass::AnalyzeLoadAvailability(LoadInst *Load, LoadDepVect &Deps,		void GVNPass::AnalyzeLoadAvailability(LoadInst *Load,
		SmallVectorImpl<ReachingMemVal> &Deps,
AvailValInBlkVect &ValuesPerBlock,		AvailValInBlkVect &ValuesPerBlock,
UnavailBlkVect &UnavailableBlocks) {		UnavailBlkVect &UnavailableBlocks) {
// Filter out useless results (non-locals, etc). Keep track of the blocks		// Filter out useless results (non-locals, etc). Keep track of the blocks
// where we have a value available in repl, also keep track of whether we see		// where we have a value available in repl, also keep track of whether we see
// dependencies that produce an unknown value for the load (such as a call		// dependencies that produce an unknown value for the load (such as a call
// that could potentially clobber the load).		// that could potentially clobber the load).
unsigned NumDeps = Deps.size();		unsigned NumDeps = Deps.size();
for (unsigned i = 0, e = NumDeps; i != e; ++i) {		for (unsigned i = 0, e = NumDeps; i != e; ++i) {
BasicBlock *DepBB = Deps[i].getBB();		const auto &Dep = Deps[i];
MemDepResult DepInfo = Deps[i].getResult();		BasicBlock *DepBB = Dep.Block;

if (DeadBlocks.count(DepBB)) {		if (DeadBlocks.count(DepBB)) {
// Dead dependent mem-op disguise as a load evaluating the same value		// Dead dependent mem-op disguise as a load evaluating the same value
// as the load in question.		// as the load in question.
ValuesPerBlock.push_back(AvailableValueInBlock::getUndef(DepBB));		ValuesPerBlock.push_back(AvailableValueInBlock::getUndef(Dep.Block));
continue;		continue;
}		}

// The address being loaded in this non-local block may not be the same as		// The address being loaded in this non-local block may not be the same as
// the pointer operand of the load if PHI translation occurs. Make sure		// the pointer operand of the load if PHI translation occurs. Make sure
// to consider the right address.		// to consider the right address.
Value *Address = Deps[i].getAddress();		Value Address = const_cast<Value >(Deps[i].Addr);
		if (Dep.Kind == DepKind::Other) {
if (!DepInfo.isDef() && !DepInfo.isClobber()) {
if (auto R = tryToConvertLoadOfPtrSelect(		if (auto R = tryToConvertLoadOfPtrSelect(
DepBB, DepBB->end(), Address, Load->getType(), getDominatorTree(),		DepBB, DepBB->end(), Address, Load->getType(), getDominatorTree(),
getAliasAnalysis())) {		getAliasAnalysis())) {
ValuesPerBlock.push_back(		ValuesPerBlock.push_back(
AvailableValueInBlock::get(DepBB, std::move(*R)));		AvailableValueInBlock::get(DepBB, std::move(*R)));
continue;		continue;
}		}
UnavailableBlocks.push_back(DepBB);		UnavailableBlocks.push_back(DepBB);
continue;		continue;
}		}

AvailableValue AV;		AvailableValue AV;
if (AnalyzeLoadAvailability(Load, DepInfo, Address, AV)) {		if (AnalyzeLoadAvailability(Load, Dep, Address, AV)) {
// subtlety: because we know this was a non-local dependency, we know		// subtlety: because we know this was a non-local dependency, we know
// it's safe to materialize anywhere between the instruction within		// it's safe to materialize anywhere between the instruction within
// DepInfo and the end of its block.		// Dep and the end of its block.
ValuesPerBlock.push_back(AvailableValueInBlock::get(DepBB,		ValuesPerBlock.push_back(AvailableValueInBlock::get(DepBB,
std::move(AV)));		std::move(AV)));
} else {		} else {
UnavailableBlocks.push_back(DepBB);		UnavailableBlocks.push_back(DepBB);
}		}
▲ Show 20 Lines • Show All 52 Lines • ▼ Show 20 Lines	for (const auto &AvailableLoad : AvailableLoads) {
// load now lives in a different BB, and we want to avoid a jumpy line		// load now lives in a different BB, and we want to avoid a jumpy line
// table.		// table.
// FIXME: How do we retain source locations without causing poor debugging		// FIXME: How do we retain source locations without causing poor debugging
// behavior?		// behavior?

// Add the newly created load.		// Add the newly created load.
ValuesPerBlock.push_back(		ValuesPerBlock.push_back(
AvailableValueInBlock::get(UnavailableBlock, NewLoad));		AvailableValueInBlock::get(UnavailableBlock, NewLoad));
		if (MD)
MD->invalidateCachedPointerInfo(LoadPtr);		MD->invalidateCachedPointerInfo(LoadPtr);
LLVM_DEBUG(dbgs() << "GVN INSERTED " << *NewLoad << '\n');		LLVM_DEBUG(dbgs() << "GVN INSERTED " << *NewLoad << '\n');
}		}

// Perform PHI construction.		// Perform PHI construction.
Value V = ConstructSSAForLoadSet(Load, ValuesPerBlock, this);		Value V = ConstructSSAForLoadSet(Load, ValuesPerBlock, this);
Load->replaceAllUsesWith(V);		Load->replaceAllUsesWith(V);
if (isa<PHINode>(V))		if (isa<PHINode>(V))
V->takeName(Load);		V->takeName(Load);
if (Instruction *I = dyn_cast<Instruction>(V))		if (Instruction *I = dyn_cast<Instruction>(V))
I->setDebugLoc(Load->getDebugLoc());		I->setDebugLoc(Load->getDebugLoc());
if (V->getType()->isPtrOrPtrVectorTy())		if (MD && V->getType()->isPtrOrPtrVectorTy())
MD->invalidateCachedPointerInfo(V);		MD->invalidateCachedPointerInfo(V);
markInstructionForDeletion(Load);		markInstructionForDeletion(Load);
ORE->emit([&]() {		ORE->emit([&]() {
return OptimizationRemark(DEBUG_TYPE, "LoadPRE", Load)		return OptimizationRemark(DEBUG_TYPE, "LoadPRE", Load)
<< "load eliminated by PRE";		<< "load eliminated by PRE";
});		});
}		}

▲ Show 20 Lines • Show All 334 Lines • ▼ Show 20 Lines
bool GVNPass::processNonLocalLoad(LoadInst *Load) {		bool GVNPass::processNonLocalLoad(LoadInst *Load) {
// non-local speculations are not allowed under asan.		// non-local speculations are not allowed under asan.
if (Load->getParent()->getParent()->hasFnAttribute(		if (Load->getParent()->getParent()->hasFnAttribute(
Attribute::SanitizeAddress) \|\|		Attribute::SanitizeAddress) \|\|
Load->getParent()->getParent()->hasFnAttribute(		Load->getParent()->getParent()->hasFnAttribute(
Attribute::SanitizeHWAddress))		Attribute::SanitizeHWAddress))
return false;		return false;

// Step 1: Find the non-local dependencies of the load.		// Find the non-local dependencies of the load.
LoadDepVect Deps;		LoadDepVect Deps;
MD->getNonLocalPointerDependency(Load, Deps);		MD->getNonLocalPointerDependency(Load, Deps);

// If we had to process more than one hundred blocks to find the		// If we had to process more than one hundred blocks to find the
// dependencies, this load isn't worth worrying about. Optimizing		// dependencies, this load isn't worth worrying about. Optimizing
// it will be too expensive.		// it will be too expensive.
unsigned NumDeps = Deps.size();		unsigned NumDeps = Deps.size();
if (NumDeps > MaxNumDeps)		if (NumDeps > MaxNumDeps)
return false;		return false;

		SmallVector<ReachingMemVal, 64> MemVals;
		for (const NonLocalDepResult &Dep : Deps) {
		Value *Address = Dep.getAddress();
		BasicBlock *BB = Dep.getBB();
		Instruction *Inst = Dep.getResult().getInst();
		if (Dep.getResult().isClobber())
		MemVals.emplace_back(ReachingMemVal::getClobber(Address, Inst));
		else if (Dep.getResult().isDef())
		MemVals.emplace_back(ReachingMemVal::getDef(Address, Inst));
		else
		MemVals.emplace_back(ReachingMemVal::getUnknown(BB, Address, Inst));
		}
		return processNonLocalLoad(Load, MemVals);
		}

		bool GVNPass ::processNonLocalLoad(LoadInst *Load,
		SmallVectorImpl<ReachingMemVal> &Deps) {
// If we had a phi translation failure, we'll have a single entry which is a		// If we had a phi translation failure, we'll have a single entry which is a
// clobber in the current block. Reject this early.		// clobber in the current block. Reject this early.
if (NumDeps == 1 &&		if (Deps.size() == 1 && Deps[0].Kind == DepKind::Other) {
!Deps[0].getResult().isDef() && !Deps[0].getResult().isClobber()) {
LLVM_DEBUG(dbgs() << "GVN: non-local load "; Load->printAsOperand(dbgs());		LLVM_DEBUG(dbgs() << "GVN: non-local load "; Load->printAsOperand(dbgs());
dbgs() << " has unknown dependencies\n";);		dbgs() << " has unknown dependencies\n";);
return false;		return false;
}		}

bool Changed = false;		bool Changed = false;
// If this load follows a GEP, see if we can PRE the indices before analyzing.		// If this load follows a GEP, see if we can PRE the indices before analyzing.
if (GetElementPtrInst *GEP =		if (GetElementPtrInst *GEP =
Show All 28 Lines	if (UnavailableBlocks.empty()) {
if (isa<PHINode>(V))		if (isa<PHINode>(V))
V->takeName(Load);		V->takeName(Load);
if (Instruction *I = dyn_cast<Instruction>(V))		if (Instruction *I = dyn_cast<Instruction>(V))
// If instruction I has debug info, then we should not update it.		// If instruction I has debug info, then we should not update it.
// Also, if I has a null DebugLoc, then it is still potentially incorrect		// Also, if I has a null DebugLoc, then it is still potentially incorrect
// to propagate Load's DebugLoc because Load may not post-dominate I.		// to propagate Load's DebugLoc because Load may not post-dominate I.
if (Load->getDebugLoc() && Load->getParent() == I->getParent())		if (Load->getDebugLoc() && Load->getParent() == I->getParent())
I->setDebugLoc(Load->getDebugLoc());		I->setDebugLoc(Load->getDebugLoc());
if (V->getType()->isPtrOrPtrVectorTy())		if (MD && V->getType()->isPtrOrPtrVectorTy())
MD->invalidateCachedPointerInfo(V);		MD->invalidateCachedPointerInfo(V);
markInstructionForDeletion(Load);		markInstructionForDeletion(Load);
++NumGVNLoad;		++NumGVNLoad;
reportLoadElim(Load, V, ORE);		reportLoadElim(Load, V, ORE);
return true;		return true;
}		}

// Step 4: Eliminate partial redundancy.		// Step 4: Eliminate partial redundancy.
▲ Show 20 Lines • Show All 207 Lines • ▼ Show 20 Lines	bool GVNPass::processAssumeIntrinsic(AssumeInst *IntrinsicI) {
return Changed;		return Changed;
}		}

static void patchAndReplaceAllUsesWith(Instruction *I, Value *Repl) {		static void patchAndReplaceAllUsesWith(Instruction *I, Value *Repl) {
patchReplacementInstruction(I, Repl);		patchReplacementInstruction(I, Repl);
I->replaceAllUsesWith(Repl);		I->replaceAllUsesWith(Repl);
}		}

		/// Scan the MemorySSA accesses of block \p BB for an instruction that
		/// settles what a load from \p Loc would read.
		///
		/// \param Loc             The memory location being loaded.
		/// \param IsInvariantLoad When true, stores in the block are also considered
		///                        as value sources and the clobbering access is never
		///                        reported as a clobber.
		/// \param BB              The block to scan.
		/// \param DomLower        Inclusive lower bound for candidate accesses within
		///                        the block, or null for no lower bound.
		/// \param DomUpper        Exclusive upper bound for candidate accesses within
		///                        the block, or null for no upper bound.
		/// \param ClobberMA       The clobbering memory access for the location.
		/// \param MSSA            MemorySSA for the function.
		/// \param AA              Batched alias analysis used for all queries.
		/// \returns A def, clobber or unknown ReachingMemVal when this block decides
		///          the outcome, or None when the caller has to keep searching (in
		///          the predecessors or past the clobbering access).
		Optional<GVNPass::ReachingMemVal> GVNPass::findReachingValueForLoadInBlock(
		    const MemoryLocation &Loc, bool IsInvariantLoad, BasicBlock *BB,
		    Instruction *DomLower, Instruction *DomUpper, MemoryAccess *ClobberMA,
		    MemorySSA &MSSA, BatchAAResults &AA) {

		  // Replace the current choice with `Candidate` if there is no choice yet or
		  // if the candidate comes after the current choice within the block.
		  auto updateChoice = [&](ReachingMemVal &Choice, AliasResult &AR,
		                          Instruction *Candidate) {
		    // TODO: Worth choosing between exact or partial overlap ?
		    if (Choice.Kind == DepKind::Other)
		      Choice.Inst = Candidate;
		    else if (MSSA.locallyDominates(MSSA.getMemoryAccess(Choice.Inst),
		                                   MSSA.getMemoryAccess(Candidate)))
		      Choice.Inst = Candidate;
		    else
		      return;

		    if (AR == AliasResult::PartialAlias) {
		      Choice.Kind = DepKind::Clobber;
		      Choice.Offset = AR.getOffset();
		    } else {
		      Choice.Kind = DepKind::Def;
		      Choice.Offset = -1;
		    }
		    Choice.Block = Candidate->getParent();
		  };

		  // Lower bound is inclusive, upper bound is exclusive.
		  auto isBetweenBounds = [&](const MemoryUseOrDef *U) {
		    if (DomLower == nullptr && DomUpper == nullptr)
		      return true;
		    MemoryAccess *Lower =
		        DomLower == nullptr ? nullptr : MSSA.getMemoryAccess(DomLower);
		    if (Lower != nullptr && !MSSA.locallyDominates(Lower, U))
		      return false;
		    MemoryAccess *Upper =
		        DomUpper == nullptr ? nullptr : MSSA.getMemoryAccess(DomUpper);
		    return Upper == nullptr || (U != Upper && MSSA.locallyDominates(U, Upper));
		  };

		  // Return the memory location accessed by the [masked]load/store instruction
		  // `I`, if the instruction could potentially provide a useful value for
		  // eliminating the load.
		  auto getLoadStoreLocationIfInteresting =
		      [&](Instruction *I,
		          bool StoresAreInteresting) -> Optional<MemoryLocation> {
		    if (auto *L = dyn_cast<LoadInst>(I))
		      return MemoryLocation::get(L);

		    if (auto *II = dyn_cast<IntrinsicInst>(I)) {
		      if (II->getIntrinsicID() == Intrinsic::masked_load)
		        return MemoryLocation::getForArgument(II, 0, TLI);
		    }

		    if (!StoresAreInteresting)
		      return None;

		    if (auto *S = dyn_cast<StoreInst>(I))
		      return MemoryLocation::get(S);

		    if (auto *II = dyn_cast<IntrinsicInst>(I)) {
		      if (II->getIntrinsicID() == Intrinsic::masked_store)
		        return MemoryLocation::getForArgument(II, 1, TLI);
		    }

		    return None;
		  };

		  // For all the memory accesses in the block.
		  const auto *MemAccessList = MSSA.getBlockAccesses(BB);
		  if (MemAccessList == nullptr)
		    return None;
		  auto ReachingVal = ReachingMemVal::getUnknown(BB, Loc.Ptr);
		  unsigned NumAccessesScanned = 0;
		  for (const MemoryAccess &MA : *MemAccessList) {
		    // If we spent too much time scanning the block, just give up and return
		    // an unknown value.
		    if (++NumAccessesScanned >= BlockScanLimit)
		      return ReachingMemVal::getUnknown(BB, Loc.Ptr);

		    auto *UseOrDef = dyn_cast<MemoryUseOrDef>(&MA);
		    if (UseOrDef == nullptr)
		      continue;

		    // We are interested only in loads here, and, in the case of an invariant
		    // load, in the stores as well.
		    Instruction *I = UseOrDef->getMemoryInst();
		    Optional<MemoryLocation> M =
		        getLoadStoreLocationIfInteresting(I, IsInvariantLoad);
		    if (!M)
		      continue;

		    // Skip if the use is not within the bounds. Additionally, the use needs to
		    // be dominated by the clobbering memory access.
		    if (!isBetweenBounds(UseOrDef) ||
		        (ClobberMA->getBlock() == BB && !MSSA.locallyDominates(ClobberMA, &MA)))
		      continue;

		    AliasResult AR = AA.alias(*M, Loc);
		    // If the locations do not certainly alias, we cannot possibly infer the
		    // following load loads the same value.
		    if (AR == AliasResult::NoAlias || AR == AliasResult::MayAlias)
		      continue;

		    // Locations partially overlap, but neither is a subset of the other, or the
		    // second location is before the first.
		    if (AR == AliasResult::PartialAlias &&
		        (!AR.hasOffset() || AR.getOffset() < 0))
		      continue;

		    // Locations precisely overlap or the second accesses a subset of the bits
		    // of the first.
		    updateChoice(ReachingVal, AR, I);
		  }

		  // Found something.
		  if (ReachingVal.Kind != DepKind::Other)
		    return ReachingVal;

		  // If the clobbering access is the entry memory state, continue the search
		  // into predecessors, unless the load is from a local object in which case
		  // return the allocation instruction.
		  if (MSSA.isLiveOnEntryDef(ClobberMA)) {
		    auto *Alloc = dyn_cast<AllocaInst>(getUnderlyingObject(Loc.Ptr));
		    if (Alloc != nullptr && Alloc->getParent() == BB)
		      return ReachingMemVal::getDef(Loc.Ptr, const_cast<AllocaInst *>(Alloc));

		    return None;
		  }

		  // If the clobbering access is a MemoryPhi or in another block, go to
		  // predecessors.
		  if (ClobberMA->getBlock() != BB || isa<MemoryPhi>(ClobberMA))
		    return None;

		  // Loads from "constant" memory can't be clobbered.
		  if (IsInvariantLoad || AA.pointsToConstantMemory(Loc))
		    return None;

		  Instruction *ClobberInst = cast<MemoryDef>(ClobberMA)->getMemoryInst();
		  auto getOrdering = [](const Instruction *I) {
		    assert(isa<LoadInst>(I) || isa<StoreInst>(I));
		    if (const auto *L = dyn_cast<LoadInst>(I))
		      return L->getOrdering();
		    return cast<StoreInst>(I)->getOrdering();
		  };

		  // Check if the clobbering access is a load or a store that we can reuse.
		  // FIXME: This is way too conservative.
		  if (Optional<MemoryLocation> M =
		          getLoadStoreLocationIfInteresting(ClobberInst, true)) {
		    AliasResult AR = AA.alias(*M, Loc);
		    if (AR == AliasResult::MustAlias)
		      return ReachingMemVal::getDef(Loc.Ptr, ClobberInst);

		    if (AR == AliasResult::NoAlias) {
		      // If the locations do not alias we may still be able to skip over the
		      // clobbering instruction, even if it is atomic.

		      // The original load is either non-atomic or unordered. We can reorder
		      // these across non-atomic, unordered or monotonic loads or across any
		      // store.
		      if (!ClobberInst->isAtomic() ||
		          !isStrongerThan(getOrdering(ClobberInst),
		                          AtomicOrdering::Monotonic) ||
		          isa<StoreInst>(ClobberInst))
		        return None;
		      return ReachingMemVal::getClobber(Loc.Ptr, ClobberInst);
		    }

		    // Skip over volatile loads (the original load is non-volatile, non-atomic).
		    if (!ClobberInst->isAtomic() && isa<LoadInst>(ClobberInst))
		      return None;

		    if (AR == AliasResult::MayAlias ||
		        (AR == AliasResult::PartialAlias &&
		         (!AR.hasOffset() || AR.getOffset() < 0)))
		      return ReachingMemVal::getClobber(Loc.Ptr, ClobberInst);

		    // The only option left is a store of the superset of the required bits.
		    assert(AR == AliasResult::PartialAlias && AR.hasOffset() &&
		           AR.getOffset() > 0 && "Follows from the conditions above");
		    return ReachingMemVal::getClobber(Loc.Ptr, ClobberInst, AR.getOffset());
		  }

		  if (const IntrinsicInst *II = dyn_cast<IntrinsicInst>(ClobberInst)) {
		    if (isa<DbgInfoIntrinsic>(II))
		      return None;
		    if (II->getIntrinsicID() == Intrinsic::lifetime_start) {
		      MemoryLocation M = MemoryLocation::getForArgument(II, 1, TLI);
		      if (AA.isMustAlias(M, Loc))
		        return ReachingMemVal::getDef(Loc.Ptr, ClobberInst);
		      return None;
		    }
		  }

		  // If we are at a malloc-like function call, we can turn the load into `undef`
		  // or zero.
		  if (isNoAliasCall(ClobberInst)) {
		    const Value *Obj = getUnderlyingObject(Loc.Ptr);
		    if (Obj == ClobberInst || AA.isMustAlias(ClobberInst, Loc.Ptr))
		      return ReachingMemVal::getDef(Loc.Ptr, ClobberInst);
		  }

		  // Can reorder loads across a release fence.
		  if (auto *Fence = dyn_cast<FenceInst>(ClobberInst)) {
		    if (Fence->getOrdering() == AtomicOrdering::Release)
		      return None;
		  }

		  // See if the clobber instruction (e.g. a call) may modify the location.
		  ModRefInfo MR = AA.getModRefInfo(ClobberInst, Loc);
		  // If modification is possible, analyse deeper, to exclude accesses to
		  // non-escaping local allocations.
		  if (isModAndRefSet(MR))
		    MR = AA.callCapturesBefore(ClobberInst, Loc, DT);
		  MR = clearMust(MR);
		  if (MR == ModRefInfo::NoModRef || MR == ModRefInfo::Ref)
		    return None;

		  // Conservatively return unknown value for the load.
		  return ReachingMemVal::getClobber(Loc.Ptr, ClobberInst);
		}

		/// Look for a load or store carrying `invariant.group` metadata that accesses
		/// the same pointer as \p L (looking through bitcasts and all-zero GEPs) and
		/// dominates \p L.
		///
		/// \param L  The load whose pointer operand is examined.
		/// \param DT Dominator tree used to compare candidate instructions.
		/// \returns The most dominating such instruction found, or nullptr when the
		///          pointer operand is a constant or no candidate other than \p L
		///          itself exists.
		static Instruction *findInvariantGroupValue(LoadInst *L, DominatorTree &DT) {
		  // We consider bitcasts and zero GEPs to be the same pointer value. Start by
		  // stripping bitcasts and zero GEPs, then we will recursively look at loads
		  // and stores through bitcasts and zero GEPs.
		  Value *PointerOperand = L->getPointerOperand()->stripPointerCasts();

		  // It's not safe to walk the use list of a global value because function
		  // passes aren't allowed to look outside their functions.
		  // FIXME: this could be fixed by filtering instructions from outside of
		  // current function.
		  if (isa<Constant>(PointerOperand))
		    return nullptr;

		  // Queue to process all pointers that are equivalent to load operand.
		  SmallVector<Value *, 8> PointerUsesQueue;
		  PointerUsesQueue.push_back(PointerOperand);

		  Instruction *MostDominatingInstruction = L;

		  // FIXME: This loop is O(n^2) because dominates can be O(n) and in worst case
		  // we will see all the instructions.
		  while (!PointerUsesQueue.empty()) {
		    Value *Ptr = PointerUsesQueue.pop_back_val();
		    assert(Ptr && !isa<GlobalValue>(Ptr) &&
		           "Null or GlobalValue should not be inserted");

		    for (User *Us : Ptr->users()) {
		      auto *U = dyn_cast<Instruction>(Us);
		      // Only instructions that dominate the best candidate so far can
		      // improve on it.
		      if (!U || U == L || !DT.dominates(U, MostDominatingInstruction))
		        continue;

		      // Add bitcasts and zero GEPs to queue.
		      if (isa<BitCastInst>(U)) {
		        PointerUsesQueue.push_back(U);
		        continue;
		      }
		      if (auto *GEP = dyn_cast<GetElementPtrInst>(U)) {
		        if (GEP->hasAllZeroIndices())
		          PointerUsesQueue.push_back(U);
		        continue;
		      }

		      // If we hit a load/store with an invariant.group metadata and the same
		      // pointer operand, we can assume that value pointed to by the pointer
		      // operand didn't change.
		      if (U->hasMetadata(LLVMContext::MD_invariant_group) &&
		          getLoadStorePointerOperand(U) == Ptr && !U->isVolatile()) {
		        MostDominatingInstruction = U;
		      }
		    }
		  }
		  return MostDominatingInstruction == L ? nullptr : MostDominatingInstruction;
		}

		/// Walk the CFG backwards from the block containing \p L and collect, per
		/// block where the search stops, the value reaching the load (a def, a
		/// clobber, or unknown).
		///
		/// \param L      The load being analysed.
		/// \param MSSA   MemorySSA for the function.
		/// \param AA     Alias analysis; wrapped in a BatchAAResults for the walk.
		/// \param Values Output list; one entry is appended for each block at which
		///               the search terminates.
		/// \returns false when more than MaxNumDeps values have been collected and
		///          the search is abandoned, true otherwise.
		bool GVNPass::findReachingValuesForLoad(
		    LoadInst *L, MemorySSA &MSSA, AAResults &AA,
		    SmallVectorImpl<ReachingMemVal> &Values) {

		  // One pending block to scan, together with the clobbering access and the
		  // (possibly phi-translated) address to use in it, and the optional bounds
		  // restricting which accesses of the block are considered.
		  struct WorkItem {
		    WorkItem(BasicBlock *BB, MemoryAccess *ClobberMA, const PHITransAddr &Addr,
		             Instruction *DomLower, Instruction *DomUpper)
		        : BB(BB), ClobberMA(ClobberMA), Addr(Addr), DomLower(DomLower),
		          DomUpper(DomUpper) {}
		    BasicBlock *BB;
		    MemoryAccess *ClobberMA;
		    PHITransAddr Addr;
		    Instruction *DomLower;
		    Instruction *DomUpper;
		  };
		  SmallVector<WorkItem, 32> Worklist;

		  // Keep the set of visited blocks, together with the pointer they were visited
		  // with. Due to phi-translation, it is possible that we come to a block with a
		  // different pointer in which case we set the block we're coming from (a
		  // successor of the visited block) as clobbering the memory location in an
		  // unknown way.
		  DenseMap<BasicBlock *, Value *> Visited;

		  // Queue the reachable, not yet visited predecessors of `BB` into `Worklist`.
		  // Returns false when `BB` itself has to be recorded as an unknown clobber.
		  auto collectPredecessors = [&](BasicBlock *BB, const PHITransAddr &Addr,
		                                 MemoryAccess *ClobberMA,
		                                 SmallVectorImpl<WorkItem> &Worklist) -> bool {
		    if (Addr.NeedsPHITranslationFromBlock(BB) &&
		        !Addr.IsPotentiallyPHITranslatable())
		      return false;
		    auto *MPhi =
		        ClobberMA->getBlock() == BB ? dyn_cast<MemoryPhi>(ClobberMA) : nullptr;
		    for (BasicBlock *Pred : predecessors(BB)) {
		      if (!DT->isReachableFromEntry(Pred))
		        continue;
		      PHITransAddr TransAddr = Addr;
		      if (TransAddr.NeedsPHITranslationFromBlock(BB))
		        TransAddr.PHITranslateValue(BB, Pred, DT, false);
		      auto It = Visited.find(Pred);
		      if (It != Visited.end()) {
		        // If we reach a visited block with a different address, set the
		        // current block as clobbering the memory location in an unknown way
		        // (by returning false).
		        if (It->second != TransAddr.getAddr()) {
		          // Undo the visited marks of the predecessors queued by this call.
		          for (const auto &T : Worklist)
		            Visited.erase(T.BB);
		          return false;
		        }
		        // Otherwise just stop the traversal.
		        continue;
		      }
		      Visited.insert({Pred, TransAddr.getAddr()});
		      Worklist.emplace_back(
		          Pred,
		          MPhi == nullptr ? ClobberMA : MPhi->getIncomingValueForBlock(Pred),
		          TransAddr, Pred == L->getParent() ? L : nullptr, nullptr);
		    }
		    return true;
		  };

		  const DataLayout &DL = L->getModule()->getDataLayout();
		  auto Loc = MemoryLocation::get(L);
		  BasicBlock *StartBlock = L->getParent();
		  bool IsInvariantLoad = L->hasMetadata(LLVMContext::MD_invariant_load);
		  bool HasSanitizer =
		      StartBlock->getParent()->hasFnAttribute(Attribute::SanitizeAddress) ||
		      StartBlock->getParent()->hasFnAttribute(Attribute::SanitizeHWAddress);
		  BatchAAResults BatchAA(AA);

		  // Traverse the CFG backwards from the block containing the load instruction,
		  // looking for instructions, from which we can deduce what value the load
		  // would, well, load. Do a depth-first search with a worklist. Blocks are
		  // marked as visited at the time of adding them to the worklist. That allows
		  // us to record a block as clobbering the memory location whenever we try to
		  // continue the search into a predecessor block for which the phi-translation
		  // fails or yields a different pointer. One exception is the initial block,
		  // which is marked visited not when we start the search (next statement
		  // below), but when we come to it for a second time via a backedge.
		  Worklist.emplace_back(StartBlock,
		                        MSSA.getMemoryAccess(L)->getDefiningAccess(),
		                        PHITransAddr(L->getPointerOperand(), DL, AC), nullptr,
		                        L);
		  while (!Worklist.empty()) {
		    // If we have found too many blocks so far this load isn't worth worrying
		    // about. Optimizing it will be too expensive.
		    if (Values.size() > MaxNumDeps)
		      return false;

		    WorkItem Item = Worklist.back();
		    Worklist.pop_back();

		    assert(((Item.BB == StartBlock && Item.DomLower == nullptr) ||
		            Visited.count(Item.BB)) &&
		           "All block in the worklist must be marked as visited (except "
		           "the very first block)");
		    assert(
		        Item.Addr.getAddr() != nullptr &&
		        "Blocks with failed phi-translation must not appear on the worklist");

		    // If we have found a definite answer (a reusable value or unknown),
		    // continue with the next block in the worklist.
		    if (Optional<ReachingMemVal> R = findReachingValueForLoadInBlock(
		            Loc.getWithNewPtr(Item.Addr.getAddr()), IsInvariantLoad, Item.BB,
		            Item.DomLower, Item.DomUpper, Item.ClobberMA, MSSA, BatchAA)) {
		      // For anything short of a def, an invariant.group access of the same
		      // pointer takes precedence when one is found.
		      if (R->Kind != DepKind::Def &&
		          L->hasMetadata(LLVMContext::MD_invariant_group)) {
		        if (Instruction *G = findInvariantGroupValue(L, *DT))
		          R = ReachingMemVal::getDef(getLoadStorePointerOperand(G), G);
		      }
		      Values.emplace_back(std::move(*R));
		      continue;
		    }

		    // Non-local speculations are not allowed under asan. Note that we can exit
		    // from here only on the first iteration of the loop.
		    assert((Item.BB == StartBlock || !HasSanitizer) &&
		           "Should have exited on the first iteration");
		    if (HasSanitizer) {
		      Values.emplace_back(ReachingMemVal::getUnknown(Item.BB, Loc.Ptr));
		      break;
		    }

		    // If the clobbering access is in another block, look in the predecessors,
		    // keeping the same clobbering access. This also handles the case when the
		    // clobbering access is liveOnEntry and we aren't at the entry block.
		    // If the clobbering access is a MemoryPhi, look in the predecessors,
		    // using the corresponding incoming value for this MemoryPhi as the
		    // clobbering access.
		    if (Item.ClobberMA->getBlock() != Item.BB ||
		        isa<MemoryPhi>(Item.ClobberMA)) {
		      SmallVector<WorkItem, 4> TmpWorklist;
		      if (!collectPredecessors(Item.BB, Item.Addr, Item.ClobberMA,
		                               TmpWorklist)) {
		        Values.push_back(
		            ReachingMemVal::getUnknown(Item.BB, Item.Addr.getAddr()));
		        continue;
		      }
		      for (auto &T : TmpWorklist) {
		        if (T.Addr.getAddr() == nullptr) {
		          // If the phi-translation to a predecessor failed, record the
		          // predecessor as a clobber.
		          Values.push_back(ReachingMemVal::getUnknown(T.BB, nullptr));
		          continue;
		        }
		        Worklist.push_back(std::move(T));
		      }
		      continue;
		    }

		    if (!MSSA.isLiveOnEntryDef(Item.ClobberMA)) {
		      // The clobbering access is a normal instruction, that we can
		      // nevertheless skip over (e.g. a release fence).
		      auto *Def = cast<MemoryUseOrDef>(Item.ClobberMA);
		      auto &Last = Worklist.emplace_back(Item);
		      Last.ClobberMA = Def->getDefiningAccess();
		      continue;
		    }

		    // If we have liveOnEntry and we are at the entry block, then this block
		    // does not provide any useful value for the load.
		    Values.emplace_back(ReachingMemVal::getUnknown(Item.BB, Loc.Ptr));
		  }

		  return true;
		}

/// Attempt to eliminate a load, first by eliminating it		/// Attempt to eliminate a load, first by eliminating it
/// locally, and then attempting non-local elimination if that fails.		/// locally, and then attempting non-local elimination if that fails.
bool GVNPass::processLoad(LoadInst *L) {		bool GVNPass::processLoad(LoadInst *L) {
if (!MD)		if (!MD && !MSSAU)
return false;		return false;

// This code hasn't been audited for ordered or volatile memory access		// This code hasn't been audited for ordered or volatile memory access
if (!L->isUnordered())		if (!L->isUnordered())
return false;		return false;

if (L->use_empty()) {		if (L->use_empty()) {
markInstructionForDeletion(L);		markInstructionForDeletion(L);
return true;		return true;
}		}

		ReachingMemVal MemVal = ReachingMemVal::getUnknown(nullptr, nullptr);
		if (MD && !MSSAU) {
// ... to a pointer that has been loaded from before...		// ... to a pointer that has been loaded from before...
MemDepResult Dep = MD->getDependency(L);		MemDepResult Dep = MD->getDependency(L);

// If it is defined in another block, try harder.		// If it is defined in another block, try harder.
if (Dep.isNonLocal())		if (Dep.isNonLocal())
return processNonLocalLoad(L);		return processNonLocalLoad(L);

Value *Address = L->getPointerOperand();
// Only handle the local case below		// Only handle the local case below
if (!Dep.isDef() && !Dep.isClobber() && !isa<SelectInst>(Address)) {		if (Dep.isDef())
// This might be a NonFuncLocal or an Unknown		MemVal = ReachingMemVal::getDef(L->getPointerOperand(), Dep.getInst());
		else if (Dep.isClobber())
		MemVal =
		ReachingMemVal::getClobber(L->getPointerOperand(), Dep.getInst());
		} else {
		SmallVector<ReachingMemVal, 8> MemVals;
		if (!findReachingValuesForLoad(L, *MSSAU->getMemorySSA(), *AA, MemVals))
		return false; // Too many dependencies.
		assert(MemVals.size() && "Expected at least an unknown value");
		if (MemVals.size() > 1 || MemVals[0].Block != L->getParent())
		return processNonLocalLoad(L, MemVals);

		// Only handle the local case below
		MemVal = MemVals[0];
		}

		Value *Address = L->getPointerOperand();
		if (MemVal.Kind == DepKind::Other && !isa<SelectInst>(Address)) {
LLVM_DEBUG(		LLVM_DEBUG(
// fast print dep, using operator<< on instruction is too slow.		// fast print dep, using operator<< on instruction is too slow.
dbgs() << "GVN: load "; L->printAsOperand(dbgs());		dbgs() << "GVN: load "; L->printAsOperand(dbgs());
dbgs() << " has unknown dependence\n";);		dbgs() << " has unknown dependence\n";);
return false;		return false;
}		}

AvailableValue AV;		AvailableValue AV;
if (AnalyzeLoadAvailability(L, Dep, Address, AV)) {		if (AnalyzeLoadAvailability(L, MemVal, Address, AV)) {
Value *AvailableValue = AV.MaterializeAdjustedValue(L, L, this);		Value *AvailableValue = AV.MaterializeAdjustedValue(L, L, this);

// Replace the load!		// Replace the load!
patchAndReplaceAllUsesWith(L, AvailableValue);		patchAndReplaceAllUsesWith(L, AvailableValue);
markInstructionForDeletion(L);		markInstructionForDeletion(L);
if (MSSAU)		if (MSSAU)
MSSAU->removeMemoryAccess(L);		MSSAU->removeMemoryAccess(L);
++NumGVNLoad;		++NumGVNLoad;
▲ Show 20 Lines • Show All 536 Lines • ▼ Show 20 Lines
bool GVNPass::runImpl(Function &F, AssumptionCache &RunAC, DominatorTree &RunDT,		bool GVNPass::runImpl(Function &F, AssumptionCache &RunAC, DominatorTree &RunDT,
const TargetLibraryInfo &RunTLI, AAResults &RunAA,		const TargetLibraryInfo &RunTLI, AAResults &RunAA,
MemoryDependenceResults *RunMD, LoopInfo *LI,		MemoryDependenceResults *RunMD, LoopInfo *LI,
OptimizationRemarkEmitter *RunORE, MemorySSA *MSSA) {		OptimizationRemarkEmitter *RunORE, MemorySSA *MSSA) {
AC = &RunAC;		AC = &RunAC;
DT = &RunDT;		DT = &RunDT;
VN.setDomTree(DT);		VN.setDomTree(DT);
TLI = &RunTLI;		TLI = &RunTLI;
		AA = &RunAA;
VN.setAliasAnalysis(&RunAA);		VN.setAliasAnalysis(&RunAA);
MD = RunMD;		MD = RunMD;
ImplicitControlFlowTracking ImplicitCFT;		ImplicitControlFlowTracking ImplicitCFT;
ICF = &ImplicitCFT;		ICF = &ImplicitCFT;
this->LI = LI;		this->LI = LI;
VN.setMemDep(MD);		VN.setMemDep(MD);
VN.setMemorySSA(MSSA);		VN.setMemorySSA(MSSA);
ORE = RunORE;		ORE = RunORE;
▲ Show 20 Lines • Show All 593 Lines • ▼ Show 20 Lines	explicit GVNLegacyPass(bool MemDepAnalysis = GVNEnableMemDep,
initializeGVNLegacyPassPass(*PassRegistry::getPassRegistry());		initializeGVNLegacyPassPass(*PassRegistry::getPassRegistry());
}		}

bool runOnFunction(Function &F) override {		bool runOnFunction(Function &F) override {
if (skipFunction(F))		if (skipFunction(F))
return false;		return false;

auto *LIWP = getAnalysisIfAvailable<LoopInfoWrapperPass>();		auto *LIWP = getAnalysisIfAvailable<LoopInfoWrapperPass>();

auto *MSSAWP = getAnalysisIfAvailable<MemorySSAWrapperPass>();
return Impl.runImpl(		return Impl.runImpl(
F, getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F),		F, getAnalysis<AssumptionCacheTracker>().getAssumptionCache(F),
getAnalysis<DominatorTreeWrapperPass>().getDomTree(),		getAnalysis<DominatorTreeWrapperPass>().getDomTree(),
getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F),		getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F),
getAnalysis<AAResultsWrapperPass>().getAAResults(),		getAnalysis<AAResultsWrapperPass>().getAAResults(),
Impl.isMemDepEnabled()		Impl.isMemDepEnabled()
? &getAnalysis<MemoryDependenceWrapperPass>().getMemDep()		? &getAnalysis<MemoryDependenceWrapperPass>().getMemDep()
: nullptr,		: nullptr,
LIWP ? &LIWP->getLoopInfo() : nullptr,		LIWP ? &LIWP->getLoopInfo() : nullptr,
&getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE(),		&getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE(),
MSSAWP ? &MSSAWP->getMSSA() : nullptr);		Impl.isMemorySSAEnabled()
		? &getAnalysis<MemorySSAWrapperPass>().getMSSA()
		: nullptr);
}		}

void getAnalysisUsage(AnalysisUsage &AU) const override {		void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.addRequired<AssumptionCacheTracker>();		AU.addRequired<AssumptionCacheTracker>();
AU.addRequired<DominatorTreeWrapperPass>();		AU.addRequired<DominatorTreeWrapperPass>();
AU.addRequired<TargetLibraryInfoWrapperPass>();		AU.addRequired<TargetLibraryInfoWrapperPass>();
AU.addRequired<LoopInfoWrapperPass>();		AU.addRequired<LoopInfoWrapperPass>();
if (Impl.isMemDepEnabled())		if (Impl.isMemDepEnabled())
Show All 31 Lines

llvm/test/Analysis/TypeBasedAliasAnalysis/gvn-nonlocal-type-mismatch.ll

; RUN: opt -tbaa -basic-aa -gvn -S < %s \| FileCheck %s		; RUN: opt -tbaa -basic-aa -gvn -S -enable-gvn-memoryssa=false < %s \| FileCheck %s --check-prefixes=CHECK,CHECK-MEMDEP
		; RUN: opt -tbaa -basic-aa -gvn -S -enable-gvn-memoryssa=true < %s \| FileCheck %s --check-prefixes=CHECK,CHECK-MEMSSA

target datalayout = "e-p:64:64:64"		target datalayout = "e-p:64:64:64"

; GVN should ignore the store to p1 to see that the load from p is		; GVN should ignore the store to p1 to see that the load from p is
; fully redundant.		; fully redundant.

; CHECK: @yes		; CHECK: @yes
; CHECK: if.then:		; CHECK: if.then:
Show All 15 Lines	if.else:
ret void		ret void
}		}

; GVN should ignore the store to p1 to see that the first load from p is		; GVN should ignore the store to p1 to see that the first load from p is
; fully redundant. However, the second load uses a different type. Theoretically		; fully redundant. However, the second load uses a different type. Theoretically
; the other type could be unified with the first type, however for now, GVN		; the other type could be unified with the first type, however for now, GVN
; should just be conservative.		; should just be conservative.

		; However, when GVN uses MemorySSA it is no longer conservative here: the load
		; in if.else is forwarded from the store of 0 to %p, just like in the next
		; function.

; CHECK: @watch_out_for_type_change		; CHECK: @watch_out_for_type_change
; CHECK: if.then:		; CHECK: if.then:
; CHECK: %t = load i32, i32* %p		; CHECK: %t = load i32, i32* %p
; CHECK: store i32 %t, i32* %q		; CHECK: store i32 %t, i32* %q
; CHECK: ret void		; CHECK: ret void
; CHECK: if.else:		; CHECK: if.else:
; CHECK: %u = load i32, i32* %p		; CHECK-MEMDEP-NEXT: %u = load i32, i32* %p
; CHECK: store i32 %u, i32* %q		; CHECK-MEMDEP-NEXT: store i32 %u, i32* %q
		; CHECK-MEMSSA-NEXT: store i32 0, i32* %q
		; CHECK-MEMSSA-NEXT: ret void

define void @watch_out_for_type_change(i1 %c, i32* %p, i32* %p1, i32* %q) nounwind {		define void @watch_out_for_type_change(i1 %c, i32* %p, i32* %p1, i32* %q) nounwind {
entry:		entry:
store i32 0, i32* %p, !tbaa !1		store i32 0, i32* %p, !tbaa !1
store i32 1, i32* %p1, !tbaa !2		store i32 1, i32* %p1, !tbaa !2
br i1 %c, label %if.else, label %if.then		br i1 %c, label %if.else, label %if.then

if.then:		if.then:
▲ Show 20 Lines • Show All 48 Lines • Show Last 20 Lines

llvm/test/Transforms/GVN/PRE/rle.ll

	; NOTE: Assertions have been autogenerated by utils/update_test_checks.py			; RUN: opt < %s -data-layout="e-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-n8:16:32" -basic-aa -gvn -enable-split-backedge-in-load-pre -enable-gvn-memoryssa=false -S -dce \| FileCheck %s --check-prefixes=CHECK,LE,LE-MEMDEP
	; RUN: opt < %s -data-layout="e-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-n8:16:32" -basic-aa -gvn -enable-split-backedge-in-load-pre -S -dce \| FileCheck %s --check-prefixes=CHECK,LE			; RUN: opt < %s -data-layout="e-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:32:64-n8:16:32" -basic-aa -gvn -enable-split-backedge-in-load-pre -enable-gvn-memoryssa=true -S -dce \| FileCheck %s --check-prefixes=CHECK,LE,LE-MEMSSA
	; RUN: opt < %s -data-layout="E-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-n32" -basic-aa -gvn -enable-split-backedge-in-load-pre -S -dce \| FileCheck %s --check-prefixes=CHECK,BE			; RUN: opt < %s -data-layout="E-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-n32" -basic-aa -gvn -enable-split-backedge-in-load-pre -enable-gvn-memoryssa=false -S -dce \| FileCheck %s --check-prefixes=CHECK,BE,BE-MEMDEP
				; RUN: opt < %s -data-layout="E-p:32:32:32-p1:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-n32" -basic-aa -gvn -enable-split-backedge-in-load-pre -enable-gvn-memoryssa=true -S -dce \| FileCheck %s --check-prefixes=CHECK,BE,BE-MEMSSA

	;; Trivial RLE test.			;; Trivial RLE test.
	define i32 @test0(i32 %V, i32* %P) {			define i32 @test0(i32 %V, i32* %P) {
	; CHECK-LABEL: @test0(			; CHECK-LABEL: @test0(
	; CHECK-NEXT: store i32 [[V:%.*]], i32* [[P:%.*]], align 4			; CHECK-NEXT: store i32 [[V:%.*]], i32* [[P:%.*]], align 4
	; CHECK-NEXT: ret i32 [[V]]			; CHECK-NEXT: ret i32 [[V]]
	;			;
	store i32 %V, i32* %P			store i32 %V, i32* %P
	▲ Show 20 Lines • Show All 997 Lines • ▼ Show 20 Lines
	}			}

	define i32 @load_load_partial_alias_cross_block_phi_trans(i8* %P) nounwind {			define i32 @load_load_partial_alias_cross_block_phi_trans(i8* %P) nounwind {
	; CHECK-LABEL: @load_load_partial_alias_cross_block_phi_trans(			; CHECK-LABEL: @load_load_partial_alias_cross_block_phi_trans(
	; CHECK-NEXT: entry:			; CHECK-NEXT: entry:
	; CHECK-NEXT: [[XX:%.*]] = bitcast i8* [[P:%.*]] to i32*			; CHECK-NEXT: [[XX:%.*]] = bitcast i8* [[P:%.*]] to i32*
	; CHECK-NEXT: [[X1:%.*]] = load i32, i32* [[XX]], align 4			; CHECK-NEXT: [[X1:%.*]] = load i32, i32* [[XX]], align 4
	; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[X1]], 127			; CHECK-NEXT: [[CMP:%.*]] = icmp eq i32 [[X1]], 127
	; LE-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 16			; LE-MEMDEP-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 16
	; BE-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 8			; BE-MEMDEP-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 8
				; LE-MEMSSA-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 8
				; BE-MEMSSA-NEXT: [[TMP0:%.*]] = lshr i32 [[X1]], 16
	; CHECK-NEXT: [[TMP1:%.*]] = trunc i32 [[TMP0]] to i8			; CHECK-NEXT: [[TMP1:%.*]] = trunc i32 [[TMP0]] to i8
	; LE-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 8			; LE-MEMDEP-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 8
	; BE-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 16			; BE-MEMDEP-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 16
				; LE-MEMSSA-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 16
				; BE-MEMSSA-NEXT: [[TMP2:%.*]] = lshr i32 [[X1]], 8
	; CHECK-NEXT: [[TMP3:%.*]] = trunc i32 [[TMP2]] to i8			; CHECK-NEXT: [[TMP3:%.*]] = trunc i32 [[TMP2]] to i8
	; CHECK-NEXT: br i1 [[CMP]], label [[IF:%.*]], label [[ELSE:%.*]]			; CHECK-NEXT: br i1 [[CMP]], label [[IF:%.*]], label [[ELSE:%.*]]
	; CHECK: if:			; CHECK: if:
	; CHECK-NEXT: br label [[JOIN:%.*]]			; CHECK-NEXT: br label [[JOIN:%.*]]
	; CHECK: else:			; CHECK: else:
	; CHECK-NEXT: br label [[JOIN]]			; CHECK-NEXT: br label [[JOIN]]
	; CHECK: join:			; CHECK: join:
	; CHECK-NEXT: [[TTMP5:%.*]] = phi i8 [ [[TMP3]], [[IF]] ], [ [[TMP1]], [[ELSE]] ]			; LE-MEMDEP-NEXT: [[TTMP5:%.*]] = phi i8 [ [[TMP3]], [[IF]] ], [ [[TMP1]], [[ELSE]] ]
				; BE-MEMDEP-NEXT: [[TTMP5:%.*]] = phi i8 [ [[TMP3]], [[IF]] ], [ [[TMP1]], [[ELSE]] ]
				; LE-MEMSSA-NEXT: [[TTMP5:%.*]] = phi i8 [ [[TMP1]], [[IF]] ], [ [[TMP3]], [[ELSE]] ]
				; BE-MEMSSA-NEXT: [[TTMP5:%.*]] = phi i8 [ [[TMP1]], [[IF]] ], [ [[TMP3]], [[ELSE]] ]
	; CHECK-NEXT: [[CONV6:%.*]] = zext i8 [[TTMP5]] to i32			; CHECK-NEXT: [[CONV6:%.*]] = zext i8 [[TTMP5]] to i32
	; CHECK-NEXT: ret i32 [[CONV6]]			; CHECK-NEXT: ret i32 [[CONV6]]
	; CHECK: if.end:			; CHECK: if.end:
	; CHECK-NEXT: ret i32 52			; CHECK-NEXT: ret i32 52
	;			;
	entry:			entry:
	%xx = bitcast i8* %P to i32*			%xx = bitcast i8* %P to i32*
	%x1 = load i32, i32* %xx, align 4			%x1 = load i32, i32* %xx, align 4
	▲ Show 20 Lines • Show All 238 Lines • ▼ Show 20 Lines
	;			;
	%x = alloca i8**, align 8			%x = alloca i8**, align 8
	store i8** getelementptr inbounds ([5 x i8*], [5 x i8*]* @_ZTV1X, i64 0, i64 2), i8*** %x, align 8			store i8** getelementptr inbounds ([5 x i8*], [5 x i8*]* @_ZTV1X, i64 0, i64 2), i8*** %x, align 8
	call void @use() nounwind			call void @use() nounwind
	%DEAD = load i8**, i8*** %x, align 8			%DEAD = load i8**, i8*** %x, align 8
	call void @use3(i8*** %x, i8** %DEAD) nounwind			call void @use3(i8*** %x, i8** %DEAD) nounwind
	ret void			ret void
	}			}


				;; Redundant-load elimination through a chain of conditional blocks.
				;; %p is noalias; block D stores to %q, blocks B and G store to %p, and
				;; block F loads %p into %u. The CHECK lines expect the load of %p in H
				;; to be replaced by a phi that takes %u on the edge from F and the
				;; constant 1 (the value stored in G) on the edge from G.
				define i32 @test_nonaliasing_clobber_ma(i1 %c0, i1 %c1, i1 %c2, i1 %c3, i32* noalias %p, i32* %q) {
				; CHECK-LABEL: @test_nonaliasing_clobber_ma(
				; CHECK-LABEL: H:
				; CHECK-NEXT: %v = phi i32 [ %u, %F ], [ 1, %G ]
				A:
				br i1 %c0, label %B, label %C

				B:
				store i32 0, i32* %p
				br label %C

				C:
				br i1 %c1, label %D, label %E

				D:
				store i32 0, i32* %q
				br label %E

				E:
				br i1 %c2, label %F, label %G

				F:
				%u = load i32, i32* %p
				br i1 %c3, label %G, label %H

				G:
				store i32 1, i32* %p
				br label %H

				H:
				%w = phi i32 [%u, %F], [0, %G]
				%v = load i32, i32* %p
				%r = add i32 %w, %v
				ret i32 %r
				}

llvm/test/Transforms/LoopVectorize/X86/metadata-enable.ll

	; NOTE: Assertions have been autogenerated by utils/update_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
	; RUN: opt < %s -mcpu=corei7 -passes='default<O1>' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O1			; RUN: opt < %s -mcpu=corei7 -passes='default<O1>' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=O1
	; RUN: opt < %s -mcpu=corei7 -passes='default<O2>' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O2			; RUN: opt < %s -mcpu=corei7 -passes='default<O2>' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=O2
	; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -S -unroll-threshold=150 -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O3			; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -S -unroll-threshold=150 -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=O3
	; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O3DEFAULT			; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false\| FileCheck %s --check-prefix=O3DEFAULT
	; RUN: opt < %s -mcpu=corei7 -passes='default<Os>' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=Os			; RUN: opt < %s -mcpu=corei7 -passes='default<Os>' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false\| FileCheck %s --check-prefix=Os
	; RUN: opt < %s -mcpu=corei7 -passes='default<Oz>' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=Oz			; RUN: opt < %s -mcpu=corei7 -passes='default<Oz>' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false\| FileCheck %s --check-prefix=Oz
	; RUN: opt < %s -mcpu=corei7 -passes='default<O1>,loop-vectorize' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O1VEC2			; RUN: opt < %s -mcpu=corei7 -passes='default<O1>,loop-vectorize' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=O1VEC2
	; RUN: opt < %s -mcpu=corei7 -passes='default<Oz>,loop-vectorize' -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=OzVEC2			; RUN: opt < %s -mcpu=corei7 -passes='default<Oz>,loop-vectorize' -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=OzVEC2
	; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -unroll-threshold=150 -vectorize-loops=false -S -unroll-allow-partial=0 \| FileCheck %s --check-prefix=O3DIS			; RUN: opt < %s -mcpu=corei7 -passes='default<O3>' -unroll-threshold=150 -vectorize-loops=false -S -unroll-allow-partial=0 -enable-gvn-memoryssa=false \| FileCheck %s --check-prefix=O3DIS

	; This file tests the llvm.loop.vectorize.enable metadata forcing			; This file tests the llvm.loop.vectorize.enable metadata forcing
	; vectorization even when optimization levels are too low, or when			; vectorization even when optimization levels are too low, or when
	; vectorization is disabled.			; vectorization is disabled.

	target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"			target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
	target triple = "x86_64-unknown-linux-gnu"			target triple = "x86_64-unknown-linux-gnu"

	▲ Show 20 Lines • Show All 1,945 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[GVN] MemorySSA for GVN: use MemorySSA for redundant loads elimination
Needs ReviewPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 440218

llvm/include/llvm/Transforms/Scalar/GVN.h

llvm/lib/Transforms/Scalar/GVN.cpp

llvm/test/Analysis/TypeBasedAliasAnalysis/gvn-nonlocal-type-mismatch.ll

llvm/test/Transforms/GVN/PRE/rle.ll

llvm/test/Transforms/LoopVectorize/X86/metadata-enable.ll

This is an archive of the discontinued LLVM Phabricator instance.

[GVN] MemorySSA for GVN: use MemorySSA for redundant loads elimination
Needs ReviewPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 440218

llvm/include/llvm/Transforms/Scalar/GVN.h

llvm/lib/Transforms/Scalar/GVN.cpp

llvm/test/Analysis/TypeBasedAliasAnalysis/gvn-nonlocal-type-mismatch.ll

llvm/test/Transforms/GVN/PRE/rle.ll

llvm/test/Transforms/LoopVectorize/X86/metadata-enable.ll

[GVN] MemorySSA for GVN: use MemorySSA for redundant loads elimination
Needs ReviewPublic