Diff 91139

include/llvm/LinkAllPasses.h

Show First 20 Lines • Show All 87 Lines • ▼ Show 20 Lines	ForcePassLinking() {
(void) llvm::createDeadStoreEliminationPass();		(void) llvm::createDeadStoreEliminationPass();
(void) llvm::createDependenceAnalysisWrapperPass();		(void) llvm::createDependenceAnalysisWrapperPass();
(void) llvm::createDivergenceAnalysisPass();		(void) llvm::createDivergenceAnalysisPass();
(void) llvm::createDomOnlyPrinterPass();		(void) llvm::createDomOnlyPrinterPass();
(void) llvm::createDomPrinterPass();		(void) llvm::createDomPrinterPass();
(void) llvm::createDomOnlyViewerPass();		(void) llvm::createDomOnlyViewerPass();
(void) llvm::createDomViewerPass();		(void) llvm::createDomViewerPass();
(void) llvm::createGCOVProfilerPass();		(void) llvm::createGCOVProfilerPass();
		(void) llvm::createPDSEPass();
(void) llvm::createPGOInstrumentationGenLegacyPass();		(void) llvm::createPGOInstrumentationGenLegacyPass();
(void) llvm::createPGOInstrumentationUseLegacyPass();		(void) llvm::createPGOInstrumentationUseLegacyPass();
(void) llvm::createPGOIndirectCallPromotionLegacyPass();		(void) llvm::createPGOIndirectCallPromotionLegacyPass();
(void) llvm::createInstrProfilingLegacyPass();		(void) llvm::createInstrProfilingLegacyPass();
(void) llvm::createFunctionImportPass();		(void) llvm::createFunctionImportPass();
(void) llvm::createFunctionInliningPass();		(void) llvm::createFunctionInliningPass();
(void) llvm::createAlwaysInlinerLegacyPass();		(void) llvm::createAlwaysInlinerLegacyPass();
(void) llvm::createGlobalDCEPass();		(void) llvm::createGlobalDCEPass();
▲ Show 20 Lines • Show All 120 Lines • Show Last 20 Lines

include/llvm/Transforms/IPO/PassManagerBuilder.h

Show First 20 Lines • Show All 141 Lines • ▼ Show 20 Lines	public:
bool DisableUnrollLoops;		bool DisableUnrollLoops;
bool BBVectorize;		bool BBVectorize;
bool SLPVectorize;		bool SLPVectorize;
bool LoopVectorize;		bool LoopVectorize;
bool RerollLoops;		bool RerollLoops;
bool LoadCombine;		bool LoadCombine;
bool NewGVN;		bool NewGVN;
bool DisableGVNLoadPRE;		bool DisableGVNLoadPRE;
		bool PDSE;
bool VerifyInput;		bool VerifyInput;
bool VerifyOutput;		bool VerifyOutput;
bool MergeFunctions;		bool MergeFunctions;
bool PrepareForLTO;		bool PrepareForLTO;
bool PrepareForThinLTO;		bool PrepareForThinLTO;
bool PerformThinLTO;		bool PerformThinLTO;

/// Enable profile instrumentation pass.		/// Enable profile instrumentation pass.
▲ Show 20 Lines • Show All 56 Lines • Show Last 20 Lines

include/llvm/Transforms/Scalar.h

	Show First 20 Lines • Show All 69 Lines • ▼ Show 20 Lines
	//			//
	// DeadStoreElimination - This pass deletes stores that are post-dominated by			// DeadStoreElimination - This pass deletes stores that are post-dominated by
	// must-aliased stores and are not loaded used between the stores.			// must-aliased stores and are not loaded used between the stores.
	//			//
	FunctionPass *createDeadStoreEliminationPass();			FunctionPass *createDeadStoreEliminationPass();

	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	//			//
				// PDSE - This pass deletes both partially and fully redundant stores.
				//
				FunctionPass *createPDSEPass();

				//===----------------------------------------------------------------------===//
				//
	// AggressiveDCE - This pass uses the SSA based Aggressive DCE algorithm. This			// AggressiveDCE - This pass uses the SSA based Aggressive DCE algorithm. This
	// algorithm assumes instructions are dead until proven otherwise, which makes			// algorithm assumes instructions are dead until proven otherwise, which makes
	// it more successful at removing non-obviously dead instructions.			// it more successful at removing non-obviously dead instructions.
	//			//
	FunctionPass *createAggressiveDCEPass();			FunctionPass *createAggressiveDCEPass();


	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//
	▲ Show 20 Lines • Show All 478 Lines • Show Last 20 Lines

lib/Transforms/IPO/PassManagerBuilder.cpp

Show First 20 Lines • Show All 68 Lines • ▼ Show 20 Lines

static cl::opt<bool> RunLoadCombine("combine-loads", cl::init(false),		static cl::opt<bool> RunLoadCombine("combine-loads", cl::init(false),
cl::Hidden,		cl::Hidden,
cl::desc("Run the load combining pass"));		cl::desc("Run the load combining pass"));

static cl::opt<bool> RunNewGVN("enable-newgvn", cl::init(false), cl::Hidden,		static cl::opt<bool> RunNewGVN("enable-newgvn", cl::init(false), cl::Hidden,
cl::desc("Run the NewGVN pass"));		cl::desc("Run the NewGVN pass"));

		// Opt-in switch "enable-pdse" (off by default, cl::Hidden). The
		// PassManagerBuilder constructor copies it into its PDSE member, which picks
		// createPDSEPass() over createDeadStoreEliminationPass() in the pipelines.
		static cl::opt<bool> RunPDSE("enable-pdse", cl::init(false), cl::Hidden,
		cl::desc("Run with PDSE instead of DSE."));
		mehdi_aminiUnsubmitted Not Done Reply Inline Actions Is "PDSE" supposed to be a well known acronym? I feel that the description could be more friendly with `--help` readers. It also sounds strange to me that "Partial DSE" is "stronger" than "DSE" alone. mehdi_amini: Is "PDSE" supposed to be a well known acronym? I feel that the description could be more…
		davideUnsubmitted Not Done Reply Inline Actions It doesn't to me, at all. See, for example, PRE (partial redundancy elimination) which is stronger than full redundancy elimination (once we agree on the meaning of stronger). davide: It doesn't to me, at all. See, for example, PRE (partial redundancy elimination) which is…
		filcabUnsubmitted Not Done Reply Inline Actions I think it helps if you look at it as (PDS)E, and not as P(DSE) :-) filcab: I think it helps if you look at it as (PDS)E, and not as P(DSE) :-)

static cl::opt<bool>		static cl::opt<bool>
RunSLPAfterLoopVectorization("run-slp-after-loop-vectorization",		RunSLPAfterLoopVectorization("run-slp-after-loop-vectorization",
cl::init(true), cl::Hidden,		cl::init(true), cl::Hidden,
cl::desc("Run the SLP vectorizer (and BB vectorizer) after the Loop "		cl::desc("Run the SLP vectorizer (and BB vectorizer) after the Loop "
"vectorizer instead of before"));		"vectorizer instead of before"));

// Experimental option to use CFL-AA		// Experimental option to use CFL-AA
enum class CFLAAType { None, Steensgaard, Andersen, Both };		enum class CFLAAType { None, Steensgaard, Andersen, Both };
▲ Show 20 Lines • Show All 68 Lines • ▼ Show 20 Lines	PassManagerBuilder::PassManagerBuilder() {
DisableUnitAtATime = false;		DisableUnitAtATime = false;
DisableUnrollLoops = false;		DisableUnrollLoops = false;
BBVectorize = RunBBVectorization;		BBVectorize = RunBBVectorization;
SLPVectorize = RunSLPVectorization;		SLPVectorize = RunSLPVectorization;
LoopVectorize = RunLoopVectorization;		LoopVectorize = RunLoopVectorization;
RerollLoops = RunLoopRerolling;		RerollLoops = RunLoopRerolling;
LoadCombine = RunLoadCombine;		LoadCombine = RunLoadCombine;
NewGVN = RunNewGVN;		NewGVN = RunNewGVN;
		PDSE = RunPDSE;
DisableGVNLoadPRE = false;		DisableGVNLoadPRE = false;
VerifyInput = false;		VerifyInput = false;
VerifyOutput = false;		VerifyOutput = false;
MergeFunctions = false;		MergeFunctions = false;
PrepareForLTO = false;		PrepareForLTO = false;
EnablePGOInstrGen = RunPGOInstrGen;		EnablePGOInstrGen = RunPGOInstrGen;
PGOInstrGen = PGOOutputFile;		PGOInstrGen = PGOOutputFile;
PGOInstrUse = RunPGOInstrUse;		PGOInstrUse = RunPGOInstrUse;
▲ Show 20 Lines • Show All 168 Lines • ▼ Show 20 Lines	void PassManagerBuilder::addFunctionSimplificationPasses(
MPM.add(createBitTrackingDCEPass()); // Delete dead bit computations		MPM.add(createBitTrackingDCEPass()); // Delete dead bit computations

// Run instcombine after redundancy elimination to exploit opportunities		// Run instcombine after redundancy elimination to exploit opportunities
// opened up by them.		// opened up by them.
addInstructionCombiningPass(MPM);		addInstructionCombiningPass(MPM);
addExtensionsToPM(EP_Peephole, MPM);		addExtensionsToPM(EP_Peephole, MPM);
MPM.add(createJumpThreadingPass()); // Thread jumps		MPM.add(createJumpThreadingPass()); // Thread jumps
MPM.add(createCorrelatedValuePropagationPass());		MPM.add(createCorrelatedValuePropagationPass());
MPM.add(createDeadStoreEliminationPass()); // Delete dead stores		MPM.add(PDSE ? createPDSEPass()
		: createDeadStoreEliminationPass()); // Delete dead stores
MPM.add(createLICMPass());		MPM.add(createLICMPass());

addExtensionsToPM(EP_ScalarOptimizerLate, MPM);		addExtensionsToPM(EP_ScalarOptimizerLate, MPM);

if (RerollLoops)		if (RerollLoops)
MPM.add(createLoopRerollPass());		MPM.add(createLoopRerollPass());
if (!RunSLPAfterLoopVectorization) {		if (!RunSLPAfterLoopVectorization) {
if (SLPVectorize)		if (SLPVectorize)
▲ Show 20 Lines • Show All 402 Lines • ▼ Show 20 Lines	void PassManagerBuilder::addLTOOptimizationPasses(legacy::PassManagerBase &PM) {
PM.add(createGlobalsAAWrapperPass()); // IP alias analysis.		PM.add(createGlobalsAAWrapperPass()); // IP alias analysis.

PM.add(createLICMPass()); // Hoist loop invariants.		PM.add(createLICMPass()); // Hoist loop invariants.
PM.add(createMergedLoadStoreMotionPass()); // Merge ld/st in diamonds.		PM.add(createMergedLoadStoreMotionPass()); // Merge ld/st in diamonds.
PM.add(NewGVN ? createNewGVNPass()		PM.add(NewGVN ? createNewGVNPass()
: createGVNPass(DisableGVNLoadPRE)); // Remove redundancies.		: createGVNPass(DisableGVNLoadPRE)); // Remove redundancies.
PM.add(createMemCpyOptPass()); // Remove dead memcpys.		PM.add(createMemCpyOptPass()); // Remove dead memcpys.

// Nuke dead stores.		PM.add(PDSE ? createPDSEPass() // Really nuke dead stores.
PM.add(createDeadStoreEliminationPass());		: createDeadStoreEliminationPass()); // Nuke dead stores.

// More loops are countable; try to optimize them.		// More loops are countable; try to optimize them.
PM.add(createIndVarSimplifyPass());		PM.add(createIndVarSimplifyPass());
PM.add(createLoopDeletionPass());		PM.add(createLoopDeletionPass());
if (EnableLoopInterchange)		if (EnableLoopInterchange)
PM.add(createLoopInterchangePass());		PM.add(createLoopInterchangePass());

if (!DisableUnrollLoops)		if (!DisableUnrollLoops)
▲ Show 20 Lines • Show All 186 Lines • Show Last 20 Lines

lib/Transforms/Scalar/PDSE.cpp

	Show All 31 Lines
	// the true block) and can be made fully redundant by inserting a copy into the			// the true block) and can be made fully redundant by inserting a copy into the
	// false block.			// false block.
	//			//
	// For a gentler introduction to PRE, see:			// For a gentler introduction to PRE, see:
	//			//
	// Partial Redundancy Elimination in SSA Form			// Partial Redundancy Elimination in SSA Form
	// https://doi.org/10.1145/319301.319348			// https://doi.org/10.1145/319301.319348
	//			//
	// Differences between the papers and this implementation:			// - TODO: Handle partial overwrite tracking during the full redundancy
	// - May-throw instructions count as killing occurrences in the factored			// elimination phase.
	// redundancy graph of escaping stores;
	// - TODO: Figure out partial overwrite tracking.
	//			//
	//===----------------------------------------------------------------------===//			//===----------------------------------------------------------------------===//

				#include "llvm/ADT/DenseSet.h"
				#include "llvm/ADT/Statistic.h"
	#include "llvm/Analysis/AliasAnalysis.h"			#include "llvm/Analysis/AliasAnalysis.h"
				#include "llvm/Analysis/CaptureTracking.h"
	#include "llvm/Analysis/GlobalsModRef.h"			#include "llvm/Analysis/GlobalsModRef.h"
				#include "llvm/Analysis/IteratedDominanceFrontier.h"
				#include "llvm/Analysis/MemoryBuiltins.h"
	#include "llvm/Analysis/PostDominators.h"			#include "llvm/Analysis/PostDominators.h"
	#include "llvm/Analysis/TargetLibraryInfo.h"			#include "llvm/Analysis/TargetLibraryInfo.h"
				#include "llvm/Analysis/ValueTracking.h"
				#include "llvm/IR/AssemblyAnnotationWriter.h"
				#include "llvm/IR/IntrinsicInst.h"
	#include "llvm/Pass.h"			#include "llvm/Pass.h"
				#include "llvm/Support/FormattedStream.h"
	#include "llvm/Transforms/Scalar.h"			#include "llvm/Transforms/Scalar.h"
	#include "llvm/Transforms/Scalar/PDSE.h"			#include "llvm/Transforms/Scalar/PDSE.h"
				#include "llvm/Transforms/Utils/BasicBlockUtils.h"
				#include "llvm/Transforms/Utils/Local.h"

				#include <list>

	#define DEBUG_TYPE "pdse"			#define DEBUG_TYPE "pdse"

	using namespace llvm;			using namespace llvm;

				STATISTIC(NumStores, "Number of stores deleted");
				STATISTIC(NumPartialReds, "Number of partial redundancies converted.");

	static cl::opt<bool>			static cl::opt<bool>
	PrintFRG("print-frg", cl::init(false), cl::Hidden,			PrintFRG("print-frg", cl::init(false), cl::Hidden,
	cl::desc("Print the factored redundancy graph of stores."));			cl::desc("Print the factored redundancy graph of stores."));

	namespace {			namespace {
	bool runPDSE(Function &F, AliasAnalysis &AA, const PostDominatorTree &PDT,			// Representations of factored redundancy graph elements.
	const TargetLibraryInfo &TLI) {			enum struct OccTy {
	if (PrintFRG) {			Real,
	DEBUG(dbgs() << "TODO: Print factored redundancy graph.\n");			Lambda,
	return false;			};

				struct RealOcc;
				struct LambdaOcc;

				// Indexes PDSE.Worklist.
				using RedIdx = unsigned;

				struct Occurrence {
				unsigned ID;
				RedIdx Class;
				// ^ Index of the redundancy class that this belongs to.
				OccTy Type;

				const RealOcc *isReal() const {
				return Type == OccTy::Real ? reinterpret_cast<const RealOcc *>(this)
				: nullptr;
				filcabUnsubmitted Not Done Reply Inline Actions `isReal`/`isLambda` sound like they return booleans. Code like `X->isReal()->isLambda()` looks weird. In my opinion, `asReal`/`asLambda` (or similar) would be easier to read (exact same behavior: If they're the type that we're asking for, return the pointer. Otherwise return `nullptr`). filcab: `isReal`/`isLambda` sound like they return booleans. Code like `X->isReal()->isLambda()` looks…
				}

				const LambdaOcc *isLambda() const {
				  // Only occurrences tagged as lambdas may be viewed as LambdaOcc.
				  if (Type != OccTy::Lambda)
				    return nullptr;
				  return reinterpret_cast<const LambdaOcc *>(this);
				}

				RealOcc *isReal() {
				  // Only occurrences tagged as real may be viewed as RealOcc.
				  if (Type != OccTy::Real)
				    return nullptr;
				  return reinterpret_cast<RealOcc *>(this);
				}

				LambdaOcc *isLambda() {
				  // Mutable counterpart of the const overload: null unless tagged Lambda.
				  if (Type != OccTy::Lambda)
				    return nullptr;
				  return reinterpret_cast<LambdaOcc *>(this);
				}

				// Stores the redundancy class index and hands the stored value back.
				RedIdx setClass(RedIdx Class_) {
				  Class = Class_;
				  return Class;
				}
				};

				struct RedClass;

				struct RealOcc final : public Occurrence {
				Instruction *Inst;
				Occurrence *Def;
				Optional<MemoryLocation> KillLoc;

				// Wraps instruction I as a real occurrence with no kill location. The class
				// index starts out as -1u and Def as null, so neither member is ever read
				// in an indeterminate state.
				RealOcc(unsigned ID, Instruction &I)
				    : Occurrence{ID, -1u, OccTy::Real}, Inst(&I), Def(nullptr),
				      KillLoc(None) {}

				// Same, but additionally records KillLoc (makeRealOcc passes the source
				// location of a memcpy/memmove here).
				RealOcc(unsigned ID, Instruction &I, MemoryLocation &&KillLoc)
				    : Occurrence{ID, -1u, OccTy::Real}, Inst(&I), Def(nullptr),
				      KillLoc(KillLoc) {}

				bool canDSE() const {
				if (auto *SI = dyn_cast<StoreInst>(Inst)) {
				return SI->isUnordered();
				} else if (auto *MI = dyn_cast<MemIntrinsic>(Inst)) {
				return !MI->isVolatile();
	} else {			} else {
	DEBUG(dbgs() << "Dummy PDSE pass.\n");			llvm_unreachable("Unknown real occurrence type.");
				}
				}

				raw_ostream &print(raw_ostream &, const SmallVectorImpl<RedClass> &) const;
				};

				struct LambdaOcc final : public Occurrence {
				struct Operand {
				  // Occurrence this operand refers to (real or lambda).
				  Occurrence *Inner;

				  // True when Inner is a real occurrence.
				  bool hasRealUse() const { return Inner->isReal() != nullptr; }

				  // Inner viewed as a lambda, or nullptr when it is a real occurrence. A
				  // real occurrence never casts to a lambda, so one isLambda() query
				  // yields the same answer as checking isReal() first.
				  // NOTE(review): if the intent was to reach the lambda *behind* a real
				  // occurrence, this needs different logic - confirm with the author.
				  LambdaOcc *getLambda() { return Inner->isLambda(); }
				};

				filcabUnsubmitted Not Done Reply Inline Actions This is always called without the second parameter. It seems code would be simpler if you just took a pointer as an argument. filcab: This is always called without the second parameter. It seems code would be simpler if you just…
				// A real occurrence recorded as a use of this lambda, together with the
				// block passed as Pred to addUse (later used as the PHI incoming block in
				// createInsertionOcc).
				struct RealUse {
				RealOcc *Occ;
				BasicBlock *Pred;

				// Instruction wrapped by the real occurrence.
				Instruction &getInst() { return *Occ->Inst; }

				// Const view of the wrapped instruction.
				const Instruction &getInst() const { return *Occ->Inst; }
				};

				BasicBlock *Block;
				SmallVector<Operand, 4> Defs;
				SmallVector<BasicBlock *, 4> NullDefs;
				SmallVector<RealUse, 4> Uses;
				// ^ All uses that alias or kill this lambda's occurrence class. A necessary
				filcabUnsubmitted Not Done Reply Inline Actions Why `isReal()->isLambda()`? Won't the `isLambda()` always return `nullptr`? (`Type` can't be both `OccTy::Real` and `OccTy::Lambda`) filcab: Why `isReal()->isLambda()`? Won't the `isLambda()` always return `nullptr`? (`Type` can't be…
				// condition for this lambda to be up-safe is that all its uses are the same
				// class.
				// Pairs of (lambda that uses this lambda, the operand of that user which
				// refers to this lambda). Needed by the lambda refinement phases
				// `CanBeAnt` and `Earlier`.
				SmallVector<std::pair<LambdaOcc *, Operand *>, 4> LambdaUses;

				// Consult the Kennedy et al. paper for these.
				bool UpSafe;
				bool CanBeAnt;
				bool Earlier;

				// Creates a lambda for Block in redundancy class Class. The ID is -1u, all
				// operand/use lists start empty, and the three refinement flags start true.
				LambdaOcc(BasicBlock &Block, RedIdx Class)
				: Occurrence{-1u, Class, OccTy::Lambda}, Block(&Block), Defs(),
				NullDefs(), Uses(), LambdaUses(), UpSafe(true), CanBeAnt(true),
				Earlier(true) {}

				// Records a real occurrence (and its associated block) as a use of this
				// lambda.
				void addUse(RealOcc &Occ, BasicBlock &Pred) { Uses.push_back({&Occ, &Pred}); }

				// Records that lambda L refers to this lambda through its operand Op.
				void addUse(LambdaOcc &L, Operand &Op) { LambdaUses.push_back({&L, &Op}); }

				// Adds one operand to this lambda. A null ReprOcc is remembered as a null
				// definition coming from Succ; otherwise the occurrence becomes an entry of
				// Defs and, if it is itself a lambda, that lambda is told about the use.
				// Returns *this so calls can be chained.
				LambdaOcc &addOperand(BasicBlock &Succ, Occurrence *ReprOcc) {
				  if (!ReprOcc) {
				    NullDefs.push_back(&Succ);
				    return *this;
				  }

				  Defs.push_back(Operand{ReprOcc});
				  // NOTE(review): the address of this element is stored by addUse; Defs is
				  // a SmallVector, so a later push_back may relocate it - confirm that is
				  // safe for the intended usage.
				  Operand &Added = Defs.back();
				  if (LambdaOcc *DefLambda = Added.getLambda())
				    DefLambda->addUse(*this, Added);
				  return *this;
				}
				davideUnsubmitted Not Done Reply Inline Actions We generally put the comment above the field and not below, can you change those? davide: We generally put the comment above the field and not below, can you change those?

				// Clears the UpSafe flag.
				void resetUpSafe() { UpSafe = false; }

				// Clears CanBeAnt; Earlier is cleared along with it.
				void resetCanBeAnt() {
				CanBeAnt = false;
				Earlier = false;
				}

				// Clears the Earlier flag only.
				void resetEarlier() { Earlier = false; }

				// True when CanBeAnt is still set and Earlier has been cleared.
				bool willBeAnt() const { return CanBeAnt && !Earlier; }

				// Returns the value operand of a store, the fill value of a memset, or the
				// raw source pointer of a memcpy/memmove. Any other instruction kind is
				// unreachable.
				static Value *getStoreOp(Instruction &I) {
				  if (auto *Store = dyn_cast<StoreInst>(&I))
				    return Store->getValueOperand();
				  if (auto *Set = dyn_cast<MemSetInst>(&I))
				    return Set->getValue();
				  if (auto *Transfer = dyn_cast<MemTransferInst>(&I))
				    return Transfer->getRawSource();
				  llvm_unreachable("Unknown real occurrence type.");
				}

				static Instruction &setStoreOp(Instruction &I, Value &V) {
				if (auto *SI = dyn_cast<StoreInst>(&I)) {
				SI->setOperand(0, &V);
				} else if (auto *MI = dyn_cast<MemSetInst>(&I)) {
				MI->setValue(&V);
				} else if (auto *MI = dyn_cast<MemTransferInst>(&I)) {
				MI->setSource(&V);
				} else {
				llvm_unreachable("Unknown real occurrence type.");
				}
				return I;
	}			}

				// See if this lambda's _|_ operands can be filled in. This requires that all
				// uses of this lambda are the same instruction type and DSE-able (e.g., not
				// volatile).
				Instruction *createInsertionOcc() {
				if (willBeAnt() && !NullDefs.empty() &&
				all_of(Uses, [](const RealUse &Use) { return Use.Occ->canDSE(); })) {
				if (Uses.size() == 1) {
				// If there's only one use, PRE can happen even if volatile.
				return Uses[0].getInst().clone();
				} else if (Uses.size() > 1) {
				// The closest real occ users must have the same instruction type
				auto Same = [&](const RealUse &Use) {
				return Use.getInst().getOpcode() == Uses[0].getInst().getOpcode();
				};
				dberlinUnsubmitted Not Done Reply Inline Actions FWIW: DenseMap<const BasicBlock , iplist<RealOcc>> will work. Just derive RealOcc from ilist_node<RealOcc> dberlin:* FWIW: DenseMap<const BasicBlock *, iplist<RealOcc>> will work. Just derive RealOcc from…
				if (std::all_of(std::next(Uses.begin()), Uses.end(), Same)) {
				assert(getStoreOp(Uses[0].getInst()) && "Expected store operand.");
				PHINode *P = IRBuilder<>(Block, Block->begin())
				.CreatePHI(getStoreOp(Uses[0].getInst())->getType(),
				Uses.size());
				for (RealUse &Use : Uses)
				P->addIncoming(getStoreOp(Use.getInst()), Use.Pred);
				return &setStoreOp(Uses[0].getInst().clone(), P);
				}
				}
				}
				return nullptr;
				}

				raw_ostream &print(raw_ostream &, const SmallVectorImpl<RedClass> &) const;
				};

				// Factored redundancy graph representation for each maximal group of
				// must-aliasing stores.
				struct RedClass {
				// The memory location that each RealOcc mods and must-alias.
				MemoryLocation Loc;
				// Indices of redundancy classes that can DSE this class.
				SmallVector<RedIdx, 8> Overwrites;
				// Indices of redundancy classes that alias this class.
				SmallVector<RedIdx, 8> Interferes;
				// Upon function unwind, can Loc escape?
				bool Escapes;
				// Is Loc returned by the function?
				bool Returned;
				// Lambda occurrences of this class; the refinement phases iterate over them.
				SmallVector<LambdaOcc *, 8> Lambdas;

				filcabUnsubmitted Not Done Reply Inline Actions We usually comment above the variable. filcab: We usually comment above the variable.
				RedClass(MemoryLocation Loc, bool Escapes, bool Returned)
				filcabUnsubmitted Not Done Reply Inline Actions Did you do any measurements/reasoning for these sizes, btw? (Just asking. No need to worry too much for now) filcab: Did you do any measurements/reasoning for these sizes, btw? (Just asking. No need to worry too…
				: Loc(std::move(Loc)), Escapes(Escapes), Returned(Returned), Lambdas() {}

				private:
				using LambdaStack = SmallVector<LambdaOcc *, 16>;

				// All of the lambda occ refinement phases follow this depth-first structure
				// to propagate some lambda flag from an initial set to the rest of the graph.
				// Consult figures 8 and 10 of Kennedy et al.
				void depthFirst(void (*push)(LambdaOcc &, LambdaStack &),
				                bool (*initial)(LambdaOcc &),
				                bool (*alreadyTraversed)(LambdaOcc &L)) {
				  LambdaStack Pending;

				  // Seed the walk from every lambda that satisfies the initial condition.
				  for (LambdaOcc *Seed : Lambdas) {
				    if (!initial(*Seed))
				      continue;
				    push(*Seed, Pending);
				  }

				  // Drain the stack, expanding each lambda that has not been handled yet.
				  while (!Pending.empty()) {
				    LambdaOcc *Top = Pending.pop_back_val();
				    if (alreadyTraversed(*Top))
				      continue;
				    push(*Top, Pending);
				  }
				}

				// If lambda P is repr occ to an operand of lambda Q and:
				//   - Q is up-unsafe (i.e., there is a reverse path from Q to function
				//     entry that doesn't cross any real occs of Q's class), and
				//   - there are no real occs from P to Q,
				// then we can conclude that P is up-unsafe too. We use this to propagate
				// up-unsafety to the rest of the FRG. Returns *this for chaining.
				RedClass &propagateUpUnsafe() {
				  auto push = [](LambdaOcc &L, LambdaStack &Stack) {
				    // Mark the lambda being expanded. For the initial (already unsafe)
				    // lambdas this is a no-op; for lambdas reached through the stack it
				    // is what actually propagates up-unsafety and what lets
				    // alreadyTraversed stop the walk on cyclic graphs.
				    L.resetUpSafe();
				    // An operand whose Inner is a lambda has no real occurrence between
				    // the two lambdas, so that lambda inherits the up-unsafety.
				    for (LambdaOcc::Operand &Op : L.Defs)
				      if (LambdaOcc *DefLambda = Op.Inner->isLambda())
				        Stack.push_back(DefLambda);
				  };
				  auto initialCond = [](LambdaOcc &L) { return !L.UpSafe; };
				  // If the top entry of the lambda stack is up-unsafe, then it and its
				  // operands have already been traversed.
				  auto &alreadyTraversed = initialCond;

				  depthFirst(push, initialCond, alreadyTraversed);
				  return *this;
				}

				// Clears CanBeAnt on every lambda that is up-unsafe and has a null operand,
				// then spreads the reset to up-unsafe users reached through operands
				// without a real use. Returns *this for chaining.
				RedClass &computeCanBeAnt() {
				  auto isSeed = [](LambdaOcc &L) {
				    return !L.UpSafe && L.CanBeAnt && !L.NullDefs.empty();
				  };
				  auto isDone = [](LambdaOcc &L) { return !L.CanBeAnt; };
				  auto expand = [](LambdaOcc &L, LambdaStack &Stack) {
				    L.resetCanBeAnt();
				    for (auto &Use : L.LambdaUses) {
				      if (Use.second->hasRealUse())
				        continue;
				      LambdaOcc *User = Use.first;
				      if (User->UpSafe || !User->CanBeAnt)
				        continue;
				      Stack.push_back(User);
				    }
				  };

				  depthFirst(expand, isSeed, isDone);
				  return *this;
				}

				// Clears Earlier on every lambda that has an operand with a real use, then
				// spreads the reset to all lambdas using those. Returns *this for chaining.
				RedClass &computeEarlier() {
				  auto isSeed = [](LambdaOcc &L) {
				    if (!L.Earlier)
				      return false;
				    auto HasRealUse = [](const LambdaOcc::Operand &Op) {
				      return Op.hasRealUse();
				    };
				    return any_of(L.Defs, HasRealUse);
				  };
				  auto isDone = [](LambdaOcc &L) { return !L.Earlier; };
				  auto expand = [](LambdaOcc &L, LambdaStack &Stack) {
				    L.resetEarlier();
				    for (auto &Use : L.LambdaUses) {
				      LambdaOcc *User = Use.first;
				      if (User->Earlier)
				        Stack.push_back(User);
				    }
				  };

				  depthFirst(expand, isSeed, isDone);
				  return *this;
				}

				public:
				// Runs the three lambda refinement phases in order and returns *this.
				RedClass &willBeAnt() {
				  propagateUpUnsafe();
				  computeCanBeAnt();
				  return computeEarlier();
				}

				// Prints the class as "<pointer value> x <size>".
				friend raw_ostream &operator<<(raw_ostream &O, const RedClass &Class) {
				  O << *Class.Loc.Ptr;
				  O << " x ";
				  O << Class.Loc.Size;
				  return O;
				}
				};

				// Prints this occurrence; ID 0 is printed as the DeadOnExit placeholder.
				raw_ostream &RealOcc::print(raw_ostream &O,
				                            const SmallVectorImpl<RedClass> &Worklist) const {
				  if (!ID)
				    return O << "DeadOnExit";

				  O << "Real @ " << Inst->getParent()->getName();
				  O << " (" << Worklist[Class] << ") ";
				  O << *Inst;
				  return O;
				}

				// Prints the lambda's block, its class, and the four flags
				// (UpSafe, CanBeAnt, Earlier, willBeAnt), each prefixed with '!' when false.
				raw_ostream &LambdaOcc::print(raw_ostream &O,
				                              const SmallVectorImpl<RedClass> &Worklist) const {
				  O << "Lambda @ " << Block->getName();
				  O << " (" << Worklist[Class] << ") [";
				  O << (UpSafe ? "U " : "!U ");
				  O << (CanBeAnt ? "C " : "!C ");
				  O << (Earlier ? "E " : "!E ");
				  O << (willBeAnt() ? "W" : "!W");
				  return O << "]";
				}

				class EscapeTracker {
				const DataLayout &DL;
				const TargetLibraryInfo &TLI;
				DenseSet<const Value *> NonEscapes;
				DenseSet<const Value *> Returns;

				public:
				bool escapesOnUnwind(const Value *V) {
				filcabUnsubmitted Not Done Reply Inline Actions Nit: We can do without the `else` in these. filcab: Nit: We can do without the `else` in these.
				if (NonEscapes.count(V))
				return false;
				if (isa<AllocaInst>(V) \|\|
				(isAllocLikeFn(V, &TLI) && !PointerMayBeCaptured(V, false, true))) {
				NonEscapes.insert(V);
	return false;			return false;
	}			}
				return true;
				}

				// Location overload: answers the query for the underlying object of Loc.Ptr.
				bool escapesOnUnwind(const MemoryLocation &Loc) {
				return escapesOnUnwind(GetUnderlyingObject(Loc.Ptr, DL));
				}

				// True if V was recorded in Returns by the constructor.
				bool returned(const Value *V) const { return Returns.count(V); }

				// Location overload: answers the query for the underlying object of Loc.Ptr.
				bool returned(const MemoryLocation &Loc) const {
				return returned(GetUnderlyingObject(Loc.Ptr, DL));
				}

				// Pre-populates both sets for F: byval/inalloca arguments are recorded as
				// non-escaping, and the underlying object of every returned value is
				// recorded as returned.
				EscapeTracker(Function &F, const TargetLibraryInfo &TLI)
				    : DL(F.getParent()->getDataLayout()), TLI(TLI) {
				  for (Argument &Arg : F.args()) {
				    if (!Arg.hasByValOrInAllocaAttr())
				      continue;
				    NonEscapes.insert(&Arg);
				  }

				  for (BasicBlock &BB : F) {
				    auto *Ret = dyn_cast<ReturnInst>(BB.getTerminator());
				    if (!Ret)
				      continue;
				    Value *RetVal = Ret->getReturnValue();
				    if (!RetVal)
				      continue;
				    Returns.insert(GetUnderlyingObject(RetVal, DL));
				  }
				}
				};

				class AliasCache {
				const SmallVectorImpl<RedClass> &Worklist;
				DenseMap<std::pair<RedIdx, MemoryLocation>, AliasResult> Aliases;
				// ^ Caches aliases between memcpy-like kill locs with each class.
				SmallVector<SmallVector<AliasResult, 8>, 8> ClassAliases;
				// ^ Caches aliasing info between occurrence classes.
				DenseMap<std::pair<RedIdx, const Instruction *>, ModRefInfo> MRI;
				AliasAnalysis &AA;

				davideUnsubmitted Not Done Reply Inline Actions why a forward list? davide: why a forward list?
				public:
				AliasCache(const SmallVectorImpl<RedClass> &Worklist, AliasAnalysis &AA)
				: Worklist(Worklist), AA(AA) {}

				// Alias query between class A's location and Loc, memoized in Aliases so
				// the underlying alias analysis is asked at most once per (A, Loc) pair.
				AliasResult alias(RedIdx A, const MemoryLocation &Loc) {
				  auto Key = std::make_pair(A, Loc);
				  if (!Aliases.count(Key))
				    Aliases[Key] = AA.alias(Worklist[A].Loc, Loc);
				  return Aliases[Key];
				}

				// Cached alias result between two classes. The table is indexed by the
				// larger index first and the smaller index second.
				AliasResult alias(RedIdx A, RedIdx B) {
				  const RedIdx Hi = std::max(A, B);
				  const RedIdx Lo = std::min(A, B);
				  return ClassAliases[Hi][Lo];
				}

				// Appends an empty row to ClassAliases and returns a reference to it.
				decltype(ClassAliases)::value_type &push() {
				ClassAliases.emplace_back();
				return ClassAliases.back();
				}

				// Drops the most recently appended row.
				void pop() { ClassAliases.pop_back(); }

				// Mod/ref query of instruction I against class A's location, memoized in
				// MRI per (A, &I) pair.
				ModRefInfo getModRefInfo(RedIdx A, const Instruction &I) {
				  auto Key = std::make_pair(A, &I);
				  if (!MRI.count(Key))
				    MRI[Key] = AA.getModRefInfo(&I, Worklist[A].Loc);
				  return MRI[Key];
				}
				};

				// Either a plain instruction or a real occurrence; both alternatives are
				// held by pointer, as PointerUnion requires.
				using InstOrReal = PointerUnion<Instruction *, RealOcc *>;

				// Per-basic-block bookkeeping; PDSE keeps one of these per BasicBlock in
				// its Blocks map.
				struct BlockInfo {
				// Entries that are each either an Instruction or a RealOcc (see InstOrReal).
				std::list<InstOrReal> Insts;
				// Real occurrences stored for this block.
				// NOTE(review): presumably std::list is used so element addresses stay
				// stable while other code holds pointers to them - confirm.
				std::list<RealOcc> Occs;
				// Lambda occurrences stored for this block.
				std::list<LambdaOcc> Lambdas;
				};

				struct PDSE {
				Function &F;
				AliasAnalysis &AA;
				davideUnsubmitted Not Done Reply Inline Actions you don't need `else` after `return`. davide: you don't need `else` after `return`.
				PostDominatorTree &PDT;
				const TargetLibraryInfo &TLI;

				unsigned NextID;
				AliasCache AC;
				EscapeTracker Tracker;
				DenseMap<const BasicBlock *, BlockInfo> Blocks;
				SmallVector<Instruction *, 16> DeadStores;
				SmallVector<RedClass, 16> Worklist;
				RealOcc DeadOnExit;
				// ^ A faux occurrence used to detect stores to non-escaping memory that are
				// redundant with respect to function exit.

				// Binds the function and its analyses. Real-occurrence IDs start at 1; ID 0
				// is reserved for DeadOnExit (RealOcc::print prints ID 0 as "DeadOnExit"),
				// which is anchored on the entry block's terminator. AC only stores a
				// reference to Worklist here, so Worklist being declared later is fine.
				PDSE(Function &F, AliasAnalysis &AA, PostDominatorTree &PDT,
				const TargetLibraryInfo &TLI)
				: F(F), AA(AA), PDT(PDT), TLI(TLI), NextID(1), AC(Worklist, AA),
				Tracker(F, TLI), DeadOnExit(0, *F.getEntryBlock().getTerminator()) {}

				// If I has the potential to be a DSE candidate (a store, memset, memcpy or
				// memmove), return its write location together with a freshly numbered
				// real occurrence wrapping it; otherwise return None. Memory transfers
				// additionally record their source location as the occurrence's kill loc.
				Optional<std::pair<MemoryLocation, RealOcc>> makeRealOcc(Instruction &I) {
				  using std::make_pair;

				  if (auto *Store = dyn_cast<StoreInst>(&I))
				    return make_pair(MemoryLocation::get(Store), RealOcc(NextID++, I));

				  if (auto *Set = dyn_cast<MemSetInst>(&I))
				    return make_pair(MemoryLocation::getForDest(Set), RealOcc(NextID++, I));

				  // memmove, memcpy.
				  if (auto *Transfer = dyn_cast<MemTransferInst>(&I))
				    return make_pair(
				        MemoryLocation::getForDest(Transfer),
				        RealOcc(NextID++, I, MemoryLocation::getForSource(Transfer)));

				  return None;
				}

				// Assigns Occ to the redundancy class for Loc and returns that class index.
				// An existing class is reused when Loc was seen before or when it
				// must-aliases a class location of the same size; otherwise a new class is
				// appended to Worklist and linked to the existing ones.
				RedIdx assignClass(const MemoryLocation &Loc, RealOcc &Occ,
				                   DenseMap<MemoryLocation, RedIdx> &BelongsToClass) {
				  // Fast path: this exact location has already been classified.
				  if (BelongsToClass.count(Loc))
				    return Occ.setClass(BelongsToClass[Loc]);

				  // Query Loc against every known class, recording each answer in a fresh
				  // alias-cache row. The row is discarded again if an existing class fits.
				  auto &Row = AC.push();
				  for (RedIdx Idx = 0; Idx < Worklist.size(); ++Idx) {
				    Row.emplace_back(AA.alias(Worklist[Idx].Loc, Loc));
				    const bool SameClass =
				        Row.back() == MustAlias && Worklist[Idx].Loc.Size == Loc.Size;
				    if (!SameClass)
				      continue;
				    AC.pop();
				    return Occ.setClass(BelongsToClass[Loc] = Idx);
				  }

				  // Occ doesn't belong to any existing class, so start a new class.
				  Worklist.emplace_back(Loc, Tracker.escapesOnUnwind(Loc),
				                        Tracker.returned(Loc));
				  const RedIdx NewIdx = Worklist.size() - 1;
				  BelongsToClass[Worklist.back().Loc] = NewIdx;

				  // Copy must-aliases and may-aliases into Overwrites and Interferes.
				  for (RedIdx Idx = 0; Idx < Row.size(); ++Idx) {
				    const AliasResult Res = Row[Idx];
				    if (Res == NoAlias)
				      continue;

				    if (Res != MustAlias) {
				      Worklist[Idx].Interferes.push_back(NewIdx);
				      Worklist[NewIdx].Interferes.push_back(Idx);
				      continue;
				    }

				    // Found a class that could either overwrite or be overwritten by the
				    // new class; the one with the larger location is the overwriter.
				    if (Worklist[NewIdx].Loc.Size >= Worklist[Idx].Loc.Size)
				      Worklist[Idx].Overwrites.push_back(NewIdx);
				    else
				      Worklist[NewIdx].Overwrites.push_back(Idx);
				  }
				  return Occ.setClass(NewIdx);
				}

				// Per-class state carried through renaming: for every redundancy class,
				// the occurrence currently exposed (or null when the class is not live).
				struct RenameState {
				  struct Incoming {
				    Occurrence *ReprOcc;
				    // If ReprOcc is a lambda, then this is the predecessor (to the
				    // lambda-containing block) that post-doms us.
				    BasicBlock *LambdaPred;
				  };

				  SmallVector<Incoming, 16> States;

				  // Every class that neither escapes nor is returned starts out exposed to
				  // DeadOnExit; all other classes start out not live.
				  RenameState(SmallVectorImpl<RedClass> &Worklist, RealOcc &DeadOnExit)
				      : States(Worklist.size()) {
				    for (RedIdx Idx = 0; Idx < Worklist.size(); ++Idx) {
				      const RedClass &Class = Worklist[Idx];
				      if (Class.Escapes || Class.Returned)
				        continue;
				      States[Idx] = {&DeadOnExit, nullptr};
				    }
				  }

				  // True when class Idx currently has an exposed occurrence.
				  bool live(RedIdx Idx) const { return States[Idx].ReprOcc != nullptr; }

				  // The exposed occurrence of class Idx if it is a lambda, else nullptr.
				  LambdaOcc *exposedLambda(RedIdx Idx) const {
				    if (!live(Idx))
				      return nullptr;
				    return States[Idx].ReprOcc->isLambda();
				  }

				  // The exposed occurrence of class Idx if it is a real occ, else nullptr.
				  RealOcc *exposedRepr(RedIdx Idx) const {
				    if (!live(Idx))
				      return nullptr;
				    return States[Idx].ReprOcc->isReal();
				  }
				};

				// Marks class Idx as no longer live in S by clearing its exposed occurrence.
				void kill(RedIdx Idx, RenameState &S) {
				  DEBUG(dbgs() << "Killing class " << Worklist[Idx] << "\n");
				  RenameState::Incoming &Slot = S.States[Idx];
				  Slot.ReprOcc = nullptr;
				  Slot.LambdaPred = nullptr;
				}

				// If class Idx currently exposes a lambda, mark that lambda up-unsafe.
				void updateUpSafety(RedIdx Idx, RenameState &S) {
				  LambdaOcc *Exposed = S.exposedLambda(Idx);
				  if (!Exposed)
				    return;
				  DEBUG(Exposed->print(dbgs() << "Setting up-unsafe: ", Worklist));
				  Exposed->resetUpSafe();
				}

				// Occ can be eliminated when the instruction itself permits it and a real
				// occurrence is currently exposed either for Occ's own class or for one of
				// the classes listed as overwriting it.
				bool canDSE(RealOcc &Occ, RenameState &S) {
				  // Can DSE if post-dommed by an overwrite.
				  return Occ.canDSE() &&
				         (S.exposedRepr(Occ.Class) ||
				          any_of(Worklist[Occ.Class].Overwrites,
				                 [&](RedIdx R) { return S.exposedRepr(R); }));
				}

				/// Processes a real occurrence that was not eliminated: installs it as the
				/// representative of its class where applicable, then applies its effect
				/// on the other incoming classes.
				void handleRealOcc(RealOcc &Occ, RenameState &S) {
				  DEBUG(Occ.print(dbgs() << "Hit a new occ: ", Worklist) << "\n");

				  // Occ can't be DSE-ed, so set it as representative of its occ class.
				  RenameState::Incoming &Own = S.States[Occ.Class];
				  if (!Own.ReprOcc) {
				    Own = RenameState::Incoming{&Occ, nullptr};
				  } else if (LambdaOcc *Exposed = Own.ReprOcc->isLambda()) {
				    // A lambda was exposed: record Occ as one of its uses (reached through
				    // the remembered predecessor), then let Occ take over the slot.
				    Exposed->addUse(Occ, *Own.LambdaPred);
				    Own = RenameState::Incoming{&Occ, nullptr};
				  }

				  // Find out how Occ interacts with incoming occ classes.
				  if (!Occ.KillLoc) {
				    // Has no kill loc. Its store loc is only significant to incoming occ
				    // classes with exposed lambdas.
				    for (RedIdx Other : Worklist[Occ.Class].Interferes)
				      updateUpSafety(Other, S);
				    return;
				  }

				  // Has a load that could kill some incoming class, in addition to the same
				  // store loc interaction above.
				  for (RedIdx Other = 0; Other < Worklist.size(); Other += 1) {
				    if (Other == Occ.Class || !S.live(Other))
				      continue;
				    if (AC.alias(Other, *Occ.KillLoc) != NoAlias) {
				      DEBUG(dbgs() << "KillLoc aliases: " << AC.alias(Other, *Occ.KillLoc)
				                   << "\n");
				      kill(Other, S);
				    } else if (AC.alias(Other, Occ.Class)) {
				      // Any non-zero alias result between the two classes counts here.
				      DEBUG(dbgs() << "Aliases: " << AC.alias(Other, Occ.Class) << "\n");
				      updateUpSafety(Other, S);
				    }
				  }
				}

				/// Applies the effect of a non-occurrence memory instruction \p I to every
				/// live class in \p S: a class is killed when it escapes and \p I may
				/// throw, or when \p I may read it; a class \p I may only write has its
				/// exposed lambda (if any) marked up-unsafe.
				void handleMayKill(Instruction &I, RenameState &S) {
				  // Depends only on I, so evaluate it once rather than once per class.
				  const bool MayThrow = I.mayThrow();

				  for (RedIdx Idx = 0; Idx < S.States.size(); Idx += 1) {
				    if (!S.live(Idx))
				      continue;

				    if (MayThrow && Worklist[Idx].Escapes) {
				      kill(Idx, S);
				      continue;
				    }

				    ModRefInfo MRI = AC.getModRefInfo(Idx, I);
				    if (MRI & MRI_Ref)
				      // Aliasing load
				      kill(Idx, S);
				    else if (MRI & MRI_Mod)
				      // Aliasing store
				      updateUpSafety(Idx, S);
				  }
				}

				/// Queues \p I on DeadStores for later deletion and bumps the NumStores
				/// counter. Nothing is erased here.
				void dse(Instruction &I) {
				  DEBUG(dbgs() << "DSE-ing " << I << " (" << I.getParent()->getName()
				               << ")\n");
				  DeadStores.push_back(&I);
				  ++NumStores;
				}

				/// Renames (and eagerly DSEs) the occurrences of \p BB, starting from the
				/// incoming state \p S (taken by value), and returns the state as it stands
				/// after the whole block has been walked bottom-up.
				RenameState renameBlock(BasicBlock &BB, RenameState S) {
				  DEBUG(dbgs() << "Entering block " << BB.getName() << "\n");
				  // Record this block if it precedes a lambda block.
				  for (RenameState::Incoming &Inc : S.States)
				    if (Inc.ReprOcc && Inc.ReprOcc->isLambda() && !Inc.LambdaPred)
				      Inc.LambdaPred = &BB;

				  // Set repr occs to lambdas, if present.
				  for (LambdaOcc &L : Blocks[&BB].Lambdas)
				    S.States[L.Class] = {&L, nullptr};

				  // Simultaneously rename and DSE in post-order.
				  for (InstOrReal &I : reverse(Blocks[&BB].Insts)) {
				    // InstOrReal holds either a RealOcc * or an Instruction *.
				    if (auto *Occ = I.dyn_cast<RealOcc *>()) {
				      if (canDSE(*Occ, S))
				        dse(*Occ->Inst);
				      else
				        handleRealOcc(*Occ, S);
				    } else {
				      // Not a real occ, but still a meminst that could kill or alias.
				      handleMayKill(*I.get<Instruction *>(), S);
				    }
				  }

				  // Lambdas directly exposed to reverse-exit are up-unsafe.
				  if (&BB == &BB.getParent()->getEntryBlock())
				    for (LambdaOcc &L : Blocks[&BB].Lambdas)
				      updateUpSafety(L.Class, S);

				  // Connect to predecessor lambdas.
				  for (BasicBlock *Pred : predecessors(&BB))
				    for (LambdaOcc &L : Blocks[Pred].Lambdas)
				      L.addOperand(BB, S.States[L.Class].ReprOcc);

				  return S;
				}

				void renamePass() {
				struct Entry {
				DomTreeNode *Node;
				DomTreeNode::iterator ChildIt;
				RenameState Inner;
				};

				SmallVector<Entry, 8> Stack;
				RenameState RootState(Worklist, DeadOnExit);
				if (BasicBlock *Root = PDT.getRootNode()->getBlock())
				// Real and unique exit block.
				Stack.push_back({PDT.getRootNode(), PDT.getRootNode()->begin(),
				renameBlock(*Root, RootState)});
				else
				// Multiple exits and/or infinite loops.
				for (DomTreeNode N : PDT.getRootNode())
				Stack.push_back(
				{N, N->begin(), renameBlock(*N->getBlock(), RootState)});

				// Visit blocks in post-dom pre-order
				while (!Stack.empty()) {
				if (Stack.back().ChildIt == Stack.back().Node->end())
				Stack.pop_back();
				else {
				DomTreeNode Cur = Stack.back().ChildIt++;
				if (Cur->begin() != Cur->end())
				Stack.push_back({Cur, Cur->begin(),
				renameBlock(*Cur->getBlock(), Stack.back().Inner)});
				else
				renameBlock(*Cur->getBlock(), Stack.back().Inner);
				}
				}
				}

				void convertPartialReds() {
				// Maps a lambda block successor to either itself or its split edge block.
				DenseMap<BasicBlock , BasicBlock > SplitBlocks;
				for (RedClass &Class : Worklist) {
				// Determine PRE-ability of this class' lambdas.
				Class.willBeAnt();
				for (LambdaOcc *L : Class.Lambdas) {

				DEBUG(L->print(dbgs() << "Trying to PRE ", Worklist) << "\n\tUses:\n");
				for (LambdaOcc::RealUse &Use : L->Uses)
				DEBUG(Use.Occ->print(dbgs() << "\t\t", Worklist) << "\n");

				DEBUG(dbgs() << "\tDefs:\n");
				for (LambdaOcc::Operand &Def : L->Defs) {
				if (RealOcc *Occ = Def.Inner->isReal())
				DEBUG(Occ->print(dbgs() << "\t\t", Worklist));
				else
				DEBUG(Def.getLambda()->print(dbgs() << "\t", Worklist) << "\n");
				}

				if (L->NullDefs.empty()) {
				// Already fully redundant, no PRE needed, trivially DSEs its uses.
				DEBUG(L->print(dbgs(), Worklist) << " is already fully redun\n");
				for (LambdaOcc::RealUse &Use : L->Uses)
				if (Use.Occ->canDSE())
				dse(Use.getInst());
				} else if (Instruction *I = L->createInsertionOcc()) {
				// L is partially redundant and can be PRE-ed.
				DEBUG(L->print(dbgs(), Worklist) << " can be PRE-ed with:\n\t" << *I
				<< "\n");
				for (BasicBlock *Succ : L->NullDefs) {
				if (SplitBlocks.count(Succ))
				Succ = SplitBlocks[Succ];
				else if (BasicBlock *Split = SplitCriticalEdge(L->Block, Succ))
				Succ = SplitBlocks[Succ] = Split;
				else
				Succ = SplitBlocks[Succ] = Succ;
				I->insertBefore(&*Succ->begin());
				DEBUG(dbgs() << "Inserting into " << Succ->getName() << "\n");
				}
				for (LambdaOcc::RealUse &Use : L->Uses) {
				++NumPartialReds;
				dse(Use.getInst());
				}
				}
				}
				}
				}

				bool run() {
				DenseMap<MemoryLocation, RedIdx> BelongsToClass;
				SmallVector<SmallPtrSet<BasicBlock *, 8>, 8> DefBlocks;

				// Collect real occs and track their basic blocks.
				for (BasicBlock &BB : F)
				for (Instruction &I : BB)
				if (auto LocOcc = makeRealOcc(I)) {
				// Found a real occ for this instruction.
				RedIdx Idx =
				assignClass(LocOcc->first, LocOcc->second, BelongsToClass);
				if (Idx + 1 > DefBlocks.size())
				DefBlocks.emplace_back();
				DefBlocks[Idx].insert(&BB);
				Blocks[&BB].Occs.emplace_back(std::move(LocOcc->second));
				Blocks[&BB].Insts.emplace_back(&Blocks[&BB].Occs.back());
				} else if (AA.getModRefInfo(&I))
				Blocks[&BB].Insts.emplace_back(&I);

				// Insert lambdas at reverse IDF of real occs and aliasing loads.
				for (RedIdx Idx = 0; Idx < Worklist.size(); Idx += 1) {
				// Find kill-only blocks.
				for (BasicBlock &BB : F)
				for (InstOrReal &I : Blocks[&BB].Insts) {
				auto Occ = I.dyn_cast<RealOcc >();
				auto II = I.dyn_cast<Instruction >();
				if ((Occ && Occ->KillLoc &&
				AC.alias(Idx, *Occ->KillLoc) != NoAlias) \|\|
				(II && AC.getModRefInfo(Idx, *II) & MRI_Ref)) {
				DefBlocks[Idx].insert(&BB);
				break;
				}
				}

				// Compute lambdas.
				ReverseIDFCalculator RIDF(PDT);
				RIDF.setDefiningBlocks(DefBlocks[Idx]);
				SmallVector<BasicBlock *, 8> LambdaBlocks;
				RIDF.calculate(LambdaBlocks);

				for (BasicBlock *BB : LambdaBlocks) {
				Blocks[BB].Lambdas.emplace_back(*BB, Idx);
				davideUnsubmitted Not Done Reply Inline Actions Can you please describe the `PDT` bug? I'm not really familiar with it (or I call it with another name :) davide: Can you please describe the `PDT` bug? I'm not really familiar with it (or I call it with…
				Worklist[Idx].Lambdas.push_back(&Blocks[BB].Lambdas.back());
				filcabUnsubmitted Not Done Reply Inline Actions Should we assert? filcab: Should we assert?
				DEBUG(Blocks[BB].Lambdas.back().print(dbgs() << "Inserted ", Worklist)
				<< "\n");
				}
				}

				renamePass();
				convertPartialReds();

				// DSE.
				while (!DeadStores.empty()) {
				Instruction *Dead = DeadStores.pop_back_val();
				for (Use &U : Dead->operands()) {
				Instruction *Op = dyn_cast<Instruction>(U);
				U.set(nullptr);
				if (Op && isInstructionTriviallyDead(Op, &TLI))
				DeadStores.push_back(Op);
				}
				Dead->eraseFromParent();
				}

				return true;
				}
				};

	class PDSELegacyPass : public FunctionPass {			class PDSELegacyPass : public FunctionPass {
	public:			public:
	PDSELegacyPass() : FunctionPass(ID) {			PDSELegacyPass() : FunctionPass(ID) {
	initializePDSELegacyPassPass(*PassRegistry::getPassRegistry());			initializePDSELegacyPassPass(*PassRegistry::getPassRegistry());
	}			}

	bool runOnFunction(Function &F) override {			bool runOnFunction(Function &F) override {
	if (skipFunction(F))			if (skipFunction(F))
	return false;			return false;

	return runPDSE(F, getAnalysis<AAResultsWrapperPass>().getAAResults(),			return PDSE(F, getAnalysis<AAResultsWrapperPass>().getAAResults(),
	getAnalysis<PostDominatorTreeWrapperPass>().getPostDomTree(),			getAnalysis<PostDominatorTreeWrapperPass>().getPostDomTree(),
	getAnalysis<TargetLibraryInfoWrapperPass>().getTLI());			getAnalysis<TargetLibraryInfoWrapperPass>().getTLI())
				.run();
	}			}

	void getAnalysisUsage(AnalysisUsage &AU) const override {			void getAnalysisUsage(AnalysisUsage &AU) const override {
	AU.addRequired<PostDominatorTreeWrapperPass>();			AU.addRequired<PostDominatorTreeWrapperPass>();
	AU.addRequired<AAResultsWrapperPass>();			AU.addRequired<AAResultsWrapperPass>();
	AU.addRequired<TargetLibraryInfoWrapperPass>();			AU.addRequired<TargetLibraryInfoWrapperPass>();

	AU.setPreservesCFG();			AU.setPreservesCFG();
	AU.addPreserved<PostDominatorTreeWrapperPass>();
	AU.addPreserved<GlobalsAAWrapperPass>();			AU.addPreserved<GlobalsAAWrapperPass>();
	}			}

	static char ID; // Pass identification, replacement for typeid			static char ID; // Pass identification, replacement for typeid
	};			};
	} // end anonymous namespace			} // end anonymous namespace

	char PDSELegacyPass::ID = 0;			char PDSELegacyPass::ID = 0;

	INITIALIZE_PASS_BEGIN(PDSELegacyPass, "pdse", "Partial Dead Store Elimination",			INITIALIZE_PASS_BEGIN(PDSELegacyPass, "pdse", "Partial Dead Store Elimination",
	false, false)			false, false)
	INITIALIZE_PASS_DEPENDENCY(PostDominatorTreeWrapperPass)			INITIALIZE_PASS_DEPENDENCY(PostDominatorTreeWrapperPass)
	INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)			INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass)
	INITIALIZE_PASS_DEPENDENCY(GlobalsAAWrapperPass)			INITIALIZE_PASS_DEPENDENCY(GlobalsAAWrapperPass)
	INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)			INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
	INITIALIZE_PASS_END(PDSELegacyPass, "pdse", "Partial Dead Store Elimination",			INITIALIZE_PASS_END(PDSELegacyPass, "pdse", "Partial Dead Store Elimination",
	false, false)			false, false)

	namespace llvm {			namespace llvm {
	PreservedAnalyses PDSEPass::run(Function &F, FunctionAnalysisManager &AM) {			PreservedAnalyses PDSEPass::run(Function &F, FunctionAnalysisManager &AM) {
	if (!runPDSE(F, AM.getResult<AAManager>(F),			if (!PDSE(F, AM.getResult<AAManager>(F),
	AM.getResult<PostDominatorTreeAnalysis>(F),			AM.getResult<PostDominatorTreeAnalysis>(F),
	AM.getResult<TargetLibraryAnalysis>(F)))			AM.getResult<TargetLibraryAnalysis>(F))
				.run())
	return PreservedAnalyses::all();			return PreservedAnalyses::all();

	PreservedAnalyses PA;			PreservedAnalyses PA;
	PA.preserveSet<CFGAnalyses>();			PA.preserveSet<CFGAnalyses>();
	PA.preserve<PostDominatorTreeAnalysis>();
	PA.preserve<GlobalsAA>();			PA.preserve<GlobalsAA>();
	return PA;			return PA;
	}			}

				/// Returns a newly allocated PDSELegacyPass as a FunctionPass pointer.
				FunctionPass *createPDSEPass() { return new PDSELegacyPass(); }
	} // end namespace llvm			} // end namespace llvm
				Inline comment (filcab, unsubmitted, not done): Please remove editor-related markup.

test/Transforms/DeadStoreElimination/pdse.ll

This file was added.

				; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
				; RUN: opt -S -pdse %s | FileCheck %s

				; External functions and intrinsics called by the tests below.
				declare void @may_throw()
				declare noalias i8* @malloc(i32)
				declare void @llvm.memcpy.p0i8.p0i8.i64(i8*, i8*, i64, i32, i1)
				declare void @llvm.memmove.p0i8.p0i8.i64(i8*, i8*, i64, i32, i1)
				declare void @llvm.memset.p0i8.i64(i8*, i8, i64, i32, i1)

				; Loop with a conditional load of %x in bb2. The CHECK lines expect no
				; store left in bb0 or bb3, and a store placed in bb2 (ahead of the load)
				; and in exit.
				define void @lo_and_chow(i8* %x, i1 %br0, i1 %br1) {
				; CHECK-LABEL: @lo_and_chow(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: [[V:%.*]] = load i8, i8* [[X:%.*]]
				; CHECK-NEXT: [[V1:%.*]] = add nuw i8 [[V]], 1
				; CHECK-NEXT: br label [[BB1:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: br i1 [[BR0:%.*]], label [[BB2:%.*]], label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: store i8 [[V1]], i8* [[X]]
				; CHECK-NEXT: [[T:%.*]] = load i8, i8* [[X]]
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: br i1 [[BR1:%.*]], label [[BB1]], label [[EXIT:%.*]]
				; CHECK: exit:
				; CHECK-NEXT: store i8 [[V1]], i8* [[X]]
				; CHECK-NEXT: ret void
				;
				bb0:
				%v = load i8, i8* %x
				%v1 = add nuw i8 %v, 1
				store i8 %v1, i8* %x
				br label %bb1
				bb1:
				br i1 %br0, label %bb2, label %bb3
				bb2:
				%t = load i8, i8* %x
				br label %bb3
				bb3:
				store i8 %v1, i8* %x
				br i1 %br1, label %bb1, label %exit
				exit:
				ret void
				}

				; demos the self-loop problem in post-dom tree.
				; define void @f(i8* %x) {
				; a:
				; store i8 0, i8* %x
				; switch i8 0, label %b [
				; i8 1, label %c
				; ]
				; b:
				; store i8 1, i8* %x
				; br label %b
				; c:
				; store i8 2, i8* %x
				; br label %d
				; d:
				; br label %d
				; e:
				; store i8 3, i8* %x
				; ret void
				; }
				;
				; define void @g(i8* %a, i8* %b) {
				; bb0:
				; store i8 undef, i8* %b
				; store i8 undef, i8* %a
				; br i1 undef, label %bb1, label %bb2
				; bb1:
				; %tmp0 = load i8, i8* %a
				; ret void
				; bb2:
				; store i8 undef, i8* %a
				; ret void
				; }

				; define void @i(i8* noalias %x, i8* noalias %y, i1 %z) {
				; %whatever = load i8, i8* %x
				; br label %nextblock
				;
				; nextblock:
				; store i8 %whatever, i8* %x
				; store i8 123, i8* %x
				; br i1 %z, label %nextblock, label %fin
				;
				; fin:
				; ret void
				; }

				; Mixes memcpy/memmove/memset intrinsics, overlapping stores through %a,
				; a call that may throw, and stores to a malloc'd pointer that is returned.
				define i8* @j(i8* %a, i8* %e, i1 %c) {
				; CHECK-LABEL: @j(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: [[P:%.*]] = tail call i8* @malloc(i32 4)
				; CHECK-NEXT: br i1 [[C:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: call void @llvm.memmove.p0i8.p0i8.i64(i8* [[A:%.*]], i8* nonnull [[E:%.*]], i64 64, i32 8, i1 false)
				; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* [[A]], i8 undef, i64 32, i32 8, i1 false)
				; CHECK-NEXT: [[X:%.*]] = bitcast i8* [[A]] to i64*
				; CHECK-NEXT: [[Z:%.*]] = getelementptr i64, i64* [[X]], i64 1
				; CHECK-NEXT: store i64 undef, i64* [[Z]]
				; CHECK-NEXT: store i8 undef, i8* [[A]]
				; CHECK-NEXT: call void @may_throw()
				; CHECK-NEXT: store i8 0, i8* [[P]]
				; CHECK-NEXT: store i8 undef, i8* [[A]]
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: ret i8* [[P]]
				;
				bb0:
				%b = alloca i8
				%P = tail call i8* @malloc(i32 4)
				br i1 %c, label %bb1, label %bb2
				bb1:
				call void @llvm.memcpy.p0i8.p0i8.i64(i8* %b, i8* nonnull %a, i64 64, i32 8, i1 false)
				call void @llvm.memmove.p0i8.p0i8.i64(i8* %a, i8* nonnull %e, i64 64, i32 8, i1 false)
				call void @llvm.memset.p0i8.i64(i8* %a, i8 undef, i64 32, i32 8, i1 false)
				%x = bitcast i8* %a to i64*
				%z = getelementptr i64, i64* %x, i64 1
				store i8 undef, i8* %a
				store i64 undef, i64* %z
				store i8 undef, i8* %a
				; ^ future full elim phase should kill this
				store i8 4, i8* %P
				call void @may_throw()
				store i8 0, i8* %P
				store i8 undef, i8* %a
				br label %bb3
				bb2:
				br label %bb3
				bb3:
				ret i8* %P
				}

				; A load of %a in bb3 sits between stores to %a. The CHECK lines expect
				; the stores in bb0 and bb1 to be gone, with a store added ahead of the
				; load in bb3.
				define void @aliasing_load_kills(i8* %a) {
				; CHECK-LABEL: @aliasing_load_kills(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: br label [[BB1:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: br i1 undef, label [[BB2:%.*]], label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: store i8 undef, i8* [[A:%.*]]
				; CHECK-NEXT: br label [[BB4:%.*]]
				; CHECK: bb3:
				; CHECK-NEXT: store i8 undef, i8* [[A]]
				; CHECK-NEXT: [[X:%.*]] = load i8, i8* [[A]]
				; CHECK-NEXT: store i8 undef, i8* [[A]]
				; CHECK-NEXT: br label [[BB4]]
				; CHECK: bb4:
				; CHECK-NEXT: ret void
				;
				bb0:
				store i8 undef, i8* %a
				br label %bb1
				bb1:
				store i8 undef, i8* %a
				br i1 undef, label %bb2, label %bb3
				bb2:
				store i8 undef, i8* %a
				br label %bb4
				bb3:
				%x = load i8, i8* %a
				store i8 undef, i8* %a
				br label %bb4
				bb4:
				ret void
				}

				; Same memcpy in bb0 and on one branch (bb1). The CHECK lines expect the
				; bb0 copy to be gone and a copy present in both bb1 and bb2.
				define void @memcpy_example(i8* %a, i8* %b, i1 %br0) {
				; CHECK-LABEL: @memcpy_example(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: br i1 [[BR0:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[A:%.*]], i8* [[B:%.*]], i64 64, i32 8, i1 false)
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: call void @llvm.memcpy.p0i8.p0i8.i64(i8* [[A]], i8* [[B]], i64 64, i32 8, i1 false)
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: ret void
				;
				bb0:
				call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 64, i32 8, i1 false)
				br i1 %br0, label %bb1, label %bb2
				bb1:
				call void @llvm.memcpy.p0i8.p0i8.i64(i8* %a, i8* %b, i64 64, i32 8, i1 false)
				br label %bb3
				bb2:
				br label %bb3
				bb3:
				ret void
				}

				; http://i.imgur.com/abuFdZ2.png
				; Two different stores to %a (in bb1 and bb2) reach bb3, and only bb4
				; overwrites them. The CHECK lines expect a phi of the two stored values
				; in bb3 and a single store of that phi in bb5.
				define void @multiple_pre(i8* %a, i8 %b, i1 %c, i1 %d) {
				; CHECK-LABEL: @multiple_pre(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: [[R:%.*]] = add i8 [[B:%.*]], 1
				; CHECK-NEXT: br i1 [[C:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: [[S:%.*]] = add i8 [[R]], 2
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: [[TMP0:%.*]] = phi i8 [ [[R]], [[BB2]] ], [ [[S]], [[BB1]] ]
				; CHECK-NEXT: br i1 [[D:%.*]], label [[BB4:%.*]], label [[BB5:%.*]]
				; CHECK: bb4:
				; CHECK-NEXT: store i8 [[R]], i8* [[A:%.*]]
				; CHECK-NEXT: br label [[EX:%.*]]
				; CHECK: bb5:
				; CHECK-NEXT: store i8 [[TMP0]], i8* [[A]]
				; CHECK-NEXT: br label [[EX]]
				; CHECK: ex:
				; CHECK-NEXT: ret void
				;
				bb0:
				%r = add i8 %b, 1
				br i1 %c, label %bb1, label %bb2
				bb1:
				%s = add i8 %r, 2
				store i8 %s, i8* %a
				br label %bb3
				bb2:
				store i8 %r, i8* %a
				br label %bb3
				bb3:
				br i1 %d, label %bb4, label %bb5
				bb4:
				store i8 %r, i8* %a
				br label %ex
				bb5:
				; Inline review note (filcab, not done): I'd rather have an ASCII diagram
				; instead of relying on an external image service (also hard to look at
				; when reading tests).
				br label %ex
				ex:
				ret void
				}

				; Same CFG as @multiple_pre, but bb1 writes %a with a memset instead of a
				; store. The CHECK lines expect every write to stay where it is.
				define void @unable_to_elim(i8* %a, i8 %b, i1 %c, i1 %d) {
				; CHECK-LABEL: @unable_to_elim(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: [[R:%.*]] = add i8 [[B:%.*]], 1
				; CHECK-NEXT: br i1 [[C:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: [[S:%.*]] = add i8 [[R]], 2
				; CHECK-NEXT: call void @llvm.memset.p0i8.i64(i8* [[A:%.*]], i8 [[S]], i64 1, i32 1, i1 false)
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: store i8 [[R]], i8* [[A]]
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: br i1 [[D:%.*]], label [[BB4:%.*]], label [[BB5:%.*]]
				; CHECK: bb4:
				; CHECK-NEXT: store i8 [[R]], i8* [[A]]
				; CHECK-NEXT: br label [[EX:%.*]]
				; CHECK: bb5:
				; CHECK-NEXT: br label [[EX]]
				; CHECK: ex:
				; CHECK-NEXT: ret void
				;
				bb0:
				%r = add i8 %b, 1
				br i1 %c, label %bb1, label %bb2
				bb1:
				%s = add i8 %r, 2
				call void @llvm.memset.p0i8.i64(i8* %a, i8 %s, i64 1, i32 1, i1 false)
				br label %bb3
				bb2:
				store i8 %r, i8* %a
				br label %bb3
				bb3:
				br i1 %d, label %bb4, label %bb5
				bb4:
				store i8 %r, i8* %a
				br label %ex
				bb5:
				br label %ex
				ex:
				ret void
				}

				; FIXME: PDSE-ing
				;
				; a, b, c --- lambda ---
				; |
				; +------- c, b, a
				;
				; into:
				;
				; --- lambda --- a, b, c
				; |
				; +------- c, b, a
				;
				; would require multiple rounds of willBeAnt
				;
				; The CHECK lines below record the current result: only the store to %c
				; moves out of bb0 (into bb1); the stores to %a and %b stay in bb0.
				define void @pre_blocked(i8* %a, i8* %b, i8* %c, i1 %br0) {
				; CHECK-LABEL: @pre_blocked(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: store i8 1, i8* [[A:%.*]]
				; CHECK-NEXT: store i8 1, i8* [[B:%.*]]
				; CHECK-NEXT: br i1 [[BR0:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: store i8 1, i8* [[C:%.*]]
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: store i8 11, i8* [[C]]
				; CHECK-NEXT: store i8 11, i8* [[B]]
				; CHECK-NEXT: store i8 11, i8* [[A]]
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: ret void
				;
				bb0:
				store i8 1, i8* %a
				store i8 1, i8* %b
				store i8 1, i8* %c
				br i1 %br0, label %bb1, label %bb2
				bb1:
				br label %bb3
				bb2:
				store i8 11, i8* %c
				store i8 11, i8* %b
				store i8 11, i8* %a
				br label %bb3
				bb3:
				ret void
				}

				; FIXME: Should transform this:
				;
				; s, s' --- lambda ---
				; |
				; +------- s
				;
				; into:
				;
				; --- lambda --- s, s'
				; |
				; +------- s'
				;
				; The CHECK lines below record the current result, in which no store is
				; moved or removed.
				define void @pre_blocked_again(i64* %a, i1 %br0) {
				; CHECK-LABEL: @pre_blocked_again(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: store i64 1, i64* [[A:%.*]]
				; CHECK-NEXT: [[X:%.*]] = bitcast i64* [[A]] to i8*
				; CHECK-NEXT: [[B:%.*]] = getelementptr i8, i8* [[X]], i64 1
				; CHECK-NEXT: store i8 2, i8* [[B]]
				; CHECK-NEXT: br i1 [[BR0:%.*]], label [[BB1:%.*]], label [[BB2:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: store i64 1, i64* [[A]]
				; CHECK-NEXT: br label [[BB3:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: br label [[BB3]]
				; CHECK: bb3:
				; CHECK-NEXT: ret void
				;
				bb0:
				store i64 1, i64* %a
				%x = bitcast i64* %a to i8*
				%b = getelementptr i8, i8* %x, i64 1
				store i8 2, i8* %b
				br i1 %br0, label %bb1, label %bb2
				bb1:
				store i64 1, i64* %a
				br label %bb3
				bb2:
				br label %bb3
				bb3:
				ret void
				}

				; Stores to a local alloca that is never read or passed anywhere. The
				; CHECK lines expect both the store and the alloca to be gone.
				define void @never_escapes() {
				; CHECK-LABEL: @never_escapes(
				; CHECK-NEXT: bb0:
				; CHECK-NEXT: br label [[BB1:%.*]]
				; CHECK: bb1:
				; CHECK-NEXT: br label [[BB2:%.*]]
				; CHECK: bb2:
				; CHECK-NEXT: ret void
				;
				bb0:
				%a = alloca i8
				br label %bb1
				bb1:
				store i8 12, i8* %a
				br label %bb2
				bb2:
				ret void
				}

This is an archive of the discontinued LLVM Phabricator instance.

[PDSE] Add PDSE.
Needs RevisionPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 91139

include/llvm/LinkAllPasses.h

include/llvm/Transforms/IPO/PassManagerBuilder.h

include/llvm/Transforms/Scalar.h

lib/Transforms/IPO/PassManagerBuilder.cpp

lib/Transforms/Scalar/PDSE.cpp

test/Transforms/DeadStoreElimination/pdse.ll

This is an archive of the discontinued LLVM Phabricator instance.

[PDSE] Add PDSE.Needs RevisionPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 91139

include/llvm/LinkAllPasses.h

include/llvm/Transforms/IPO/PassManagerBuilder.h

include/llvm/Transforms/Scalar.h

lib/Transforms/IPO/PassManagerBuilder.cpp

lib/Transforms/Scalar/PDSE.cpp

test/Transforms/DeadStoreElimination/pdse.ll

[PDSE] Add PDSE.
Needs RevisionPublic