Diff 526640

llvm/include/llvm/Transforms/Scalar/Reassociate.h

Show All 31 Lines
namespace llvm {		namespace llvm {

class APInt;		class APInt;
class BasicBlock;		class BasicBlock;
class BinaryOperator;		class BinaryOperator;
class Function;		class Function;
class Instruction;		class Instruction;
class IRBuilderBase;		class IRBuilderBase;
		class LoopInfo;
class Value;		class Value;

/// A private "module" namespace for types and utilities used by Reassociate.		/// A private "module" namespace for types and utilities used by Reassociate.
/// These are implementation details and should not be used by clients.		/// These are implementation details and should not be used by clients.
namespace reassociate {		namespace reassociate {

struct ValueEntry {		struct ValueEntry {
unsigned Rank;		unsigned Rank;
▲ Show 20 Lines • Show All 43 Lines • ▼ Show 20 Lines	protected:
};		};
DenseMap<std::pair<Value , Value >, PairMapValue> PairMap[NumBinaryOps];		DenseMap<std::pair<Value , Value >, PairMapValue> PairMap[NumBinaryOps];

bool MadeChange;		bool MadeChange;

public:		public:
PreservedAnalyses run(Function &F, FunctionAnalysisManager &);		PreservedAnalyses run(Function &F, FunctionAnalysisManager &);

		// Glue for old PM.
		bool runImpl(Function &F, LoopInfo &LI);

private:		private:
void BuildRankMap(Function &F, ReversePostOrderTraversal<Function *> &RPOT);		void BuildRankMap(Function &F, ReversePostOrderTraversal<Function *> &RPOT);
unsigned getRank(Value *V);		unsigned getRank(Value *V);
void canonicalizeOperands(Instruction *I);		void canonicalizeOperands(Instruction *I);
void ReassociateExpression(BinaryOperator *I);		void ReassociateExpression(BinaryOperator *I, LoopInfo &LI);
void RewriteExprTree(BinaryOperator *I,		void RewriteExprTree(BinaryOperator *I,
SmallVectorImpl<reassociate::ValueEntry> &Ops);		SmallVectorImpl<reassociate::ValueEntry> &Ops);
Value OptimizeExpression(BinaryOperator I,		Value OptimizeExpression(BinaryOperator I,
SmallVectorImpl<reassociate::ValueEntry> &Ops);		SmallVectorImpl<reassociate::ValueEntry> &Ops,
		LoopInfo &LI);
Value OptimizeAdd(Instruction I,		Value OptimizeAdd(Instruction I,
SmallVectorImpl<reassociate::ValueEntry> &Ops);		SmallVectorImpl<reassociate::ValueEntry> &Ops,
		LoopInfo &LI);
Value OptimizeXor(Instruction I,		Value OptimizeXor(Instruction I,
SmallVectorImpl<reassociate::ValueEntry> &Ops);		SmallVectorImpl<reassociate::ValueEntry> &Ops);
bool CombineXorOpnd(Instruction I, reassociate::XorOpnd Opnd1,		bool CombineXorOpnd(Instruction I, reassociate::XorOpnd Opnd1,
APInt &ConstOpnd, Value *&Res);		APInt &ConstOpnd, Value *&Res);
bool CombineXorOpnd(Instruction I, reassociate::XorOpnd Opnd1,		bool CombineXorOpnd(Instruction I, reassociate::XorOpnd Opnd1,
reassociate::XorOpnd *Opnd2, APInt &ConstOpnd,		reassociate::XorOpnd *Opnd2, APInt &ConstOpnd,
Value *&Res);		Value *&Res);
Value *buildMinimalMultiplyDAG(IRBuilderBase &Builder,		Value *buildMinimalMultiplyDAG(IRBuilderBase &Builder,
SmallVectorImpl<reassociate::Factor> &Factors);		SmallVectorImpl<reassociate::Factor> &Factors);
Value OptimizeMul(BinaryOperator I,		Value OptimizeMul(BinaryOperator I,
SmallVectorImpl<reassociate::ValueEntry> &Ops);		SmallVectorImpl<reassociate::ValueEntry> &Ops);
Value RemoveFactorFromExpression(Value V, Value *Factor);		Value RemoveFactorFromExpression(Value V, Value *Factor);
void EraseInst(Instruction *I);		void EraseInst(Instruction *I);
void RecursivelyEraseDeadInsts(Instruction *I, OrderedSet &Insts);		void RecursivelyEraseDeadInsts(Instruction *I, OrderedSet &Insts);
void OptimizeInst(Instruction *I);		void OptimizeInst(Instruction *I, LoopInfo &LI);
Instruction canonicalizeNegFPConstantsForOp(Instruction I, Instruction *Op,		Instruction canonicalizeNegFPConstantsForOp(Instruction I, Instruction *Op,
Value *OtherOp);		Value *OtherOp);
Instruction canonicalizeNegFPConstants(Instruction I);		Instruction canonicalizeNegFPConstants(Instruction I);
void BuildPairMap(ReversePostOrderTraversal<Function *> &RPOT);		void BuildPairMap(ReversePostOrderTraversal<Function *> &RPOT);
};		};

} // end namespace llvm		} // end namespace llvm

#endif // LLVM_TRANSFORMS_SCALAR_REASSOCIATE_H		#endif // LLVM_TRANSFORMS_SCALAR_REASSOCIATE_H

llvm/lib/Transforms/Scalar/Reassociate.cpp

Show All 25 Lines
#include "llvm/ADT/PostOrderIterator.h"		#include "llvm/ADT/PostOrderIterator.h"
#include "llvm/ADT/SmallPtrSet.h"		#include "llvm/ADT/SmallPtrSet.h"
#include "llvm/ADT/SmallSet.h"		#include "llvm/ADT/SmallSet.h"
#include "llvm/ADT/SmallVector.h"		#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/Statistic.h"		#include "llvm/ADT/Statistic.h"
#include "llvm/Analysis/BasicAliasAnalysis.h"		#include "llvm/Analysis/BasicAliasAnalysis.h"
#include "llvm/Analysis/ConstantFolding.h"		#include "llvm/Analysis/ConstantFolding.h"
#include "llvm/Analysis/GlobalsModRef.h"		#include "llvm/Analysis/GlobalsModRef.h"
		#include "llvm/Analysis/LoopInfo.h"
#include "llvm/Analysis/ValueTracking.h"		#include "llvm/Analysis/ValueTracking.h"
#include "llvm/IR/Argument.h"		#include "llvm/IR/Argument.h"
#include "llvm/IR/BasicBlock.h"		#include "llvm/IR/BasicBlock.h"
#include "llvm/IR/CFG.h"		#include "llvm/IR/CFG.h"
#include "llvm/IR/Constant.h"		#include "llvm/IR/Constant.h"
#include "llvm/IR/Constants.h"		#include "llvm/IR/Constants.h"
#include "llvm/IR/Function.h"		#include "llvm/IR/Function.h"
#include "llvm/IR/IRBuilder.h"		#include "llvm/IR/IRBuilder.h"
Show All 11 Lines
#include "llvm/Pass.h"		#include "llvm/Pass.h"
#include "llvm/Support/Casting.h"		#include "llvm/Support/Casting.h"
#include "llvm/Support/Debug.h"		#include "llvm/Support/Debug.h"
#include "llvm/Support/raw_ostream.h"		#include "llvm/Support/raw_ostream.h"
#include "llvm/Transforms/Scalar.h"		#include "llvm/Transforms/Scalar.h"
#include "llvm/Transforms/Utils/Local.h"		#include "llvm/Transforms/Utils/Local.h"
#include <algorithm>		#include <algorithm>
#include <cassert>		#include <cassert>
		#include <functional>
#include <utility>		#include <utility>

using namespace llvm;		using namespace llvm;
using namespace reassociate;		using namespace reassociate;
using namespace PatternMatch;		using namespace PatternMatch;

#define DEBUG_TYPE "reassociate"		#define DEBUG_TYPE "reassociate"

▲ Show 20 Lines • Show All 1,459 Lines • ▼ Show 20 Lines	Value ReassociatePass::OptimizeXor(Instruction I,

return nullptr;		return nullptr;
}		}

/// Optimize a series of operands to an 'add' instruction. This		/// Optimize a series of operands to an 'add' instruction. This
/// optimizes based on identities. If it can be reduced to a single Value, it		/// optimizes based on identities. If it can be reduced to a single Value, it
/// is returned, otherwise the Ops list is mutated as necessary.		/// is returned, otherwise the Ops list is mutated as necessary.
Value ReassociatePass::OptimizeAdd(Instruction I,		Value ReassociatePass::OptimizeAdd(Instruction I,
SmallVectorImpl<ValueEntry> &Ops) {		SmallVectorImpl<ValueEntry> &Ops,
		LoopInfo &LI) {
// Scan the operand lists looking for X and -X pairs. If we find any, we		// Scan the operand lists looking for X and -X pairs. If we find any, we
// can simplify expressions like X+-X == 0 and X+~X ==-1. While we're at it,		// can simplify expressions like X+-X == 0 and X+~X ==-1. While we're at it,
// scan for any		// scan for any
// duplicates. We want to canonicalize Y+Y+Y+Z -> 3*Y+Z.		// duplicates. We want to canonicalize Y+Y+Y+Z -> 3*Y+Z.

for (unsigned i = 0, e = Ops.size(); i != e; ++i) {		for (unsigned i = 0, e = Ops.size(); i != e; ++i) {
Value *TheOp = Ops[i].Op;		Value *TheOp = Ops[i].Op;
// Check to see if we've seen this operand before. If so, we factor all		// Check to see if we've seen this operand before. If so, we factor all
▲ Show 20 Lines • Show All 139 Lines • ▼ Show 20 Lines	Value ReassociatePass::OptimizeAdd(Instruction I,
}		}

// If any factor occurred more than one time, we can pull it out.		// If any factor occurred more than one time, we can pull it out.
if (MaxOcc > 1) {		if (MaxOcc > 1) {
LLVM_DEBUG(dbgs() << "\nFACTORING [" << MaxOcc << "]: " << *MaxOccVal		LLVM_DEBUG(dbgs() << "\nFACTORING [" << MaxOcc << "]: " << *MaxOccVal
<< '\n');		<< '\n');
++NumFactor;		++NumFactor;

		// This transformation can potentially move a loop invariant computation
		// into the loop. This should be avoided as it increases the number of
		// computations and has potential to prevent other optimizations that would
		// need to know how to revert this transformation in order to succeed.

		nikicUnsubmitted Done Reply Inline Actions These need to be fetched from the pass manager instead. nikic: These need to be fetched from the pass manager instead.
		pawosm01AuthorUnsubmitted Done Reply Inline Actions OK, used pass manager instead. pawosm01: OK, used pass manager instead.
		// Go through the operations and see if all the operands belong to the same
		// loop.
		nikicUnsubmitted Done Reply Inline Actions Should be just `LoopInfo`. nikic: Should be just `LoopInfo`.
		pawosm01AuthorUnsubmitted Done Reply Inline Actions Although this place has gone, I've considered your suggestion in the other place below. pawosm01: Although this place has gone, I've considered your suggestion in the other place below.
		for (unsigned i = 0, e = Ops.size(); i != e; ++i) {
		// Only consider expressions we're allowed to transform.
		BinaryOperator *BOp =
		isReassociableOp(Ops[i].Op, Instruction::Mul, Instruction::FMul);
		qcolombetUnsubmitted Not Done Reply Inline Actions Although it is less performance sensitive, pulling adds in a loop could also be problematic. qcolombet: Although it is less performance sensitive, pulling adds in a loop could also be problematic.
		if (!BOp)
		continue;
		tschuettUnsubmitted Done Reply Inline Actions for (unsigned i = 0, size_t e = Ops.size(); i != e; ++i) { } tschuett: for (unsigned i = 0, size_t e = Ops.size(); i != e; ++i) { }
		pawosm01AuthorUnsubmitted Done Reply Inline Actions Thanks for spotting that! pawosm01: Thanks for spotting that!

		if (Loop *L = LI.getLoopFor(BOp->getParent())) {
		qcolombetUnsubmitted Not Done Reply Inline Actions Early exit to reduce indentation qcolombet: Early exit to reduce indentation
		// Make sure we're not pulling operands from the outside of the loop.
		for (Value *Operand : BOp->operands()) {
		std::function<bool(LoopInfo &, Value , Loop )> isInOneLoop =
		[&isInOneLoop](LoopInfo &LI, Value V, Loop L) -> bool {
		Instruction *I = dyn_cast<Instruction>(V);

		if (!I)
		return true;
		if ((LI.getLoopFor(I->getParent()) != L) \|\| (dyn_cast<PHINode>(I)))
		return false;
		qcolombetUnsubmitted Not Done Reply Inline Actions Shouldn't PHIs with the same loop as L return `true` here? qcolombet: Shouldn't PHIs with the same loop as L return `true` here?
		for (Value *Operand : I->operands()) {
		if (!isInOneLoop(LI, Operand, L))
		return false;
		}
		return true;
		};
		std::function<bool(Value , Value )> hasFactor =
		[&hasFactor](Value V, Value Factor) -> bool {
		BinaryOperator *BO =
		isReassociableOp(V, Instruction::Mul, Instruction::FMul);

		if (!BO)
		return V == Factor;
		nikicUnsubmitted Done Reply Inline Actions This looks like a very complicated and inefficient re-implementation of `LI->getLoopFor()`. nikic: This looks like a very complicated and inefficient re-implementation of `LI->getLoopFor()`.
		pawosm01AuthorUnsubmitted Done Reply Inline Actions using LI->getLoopFor() instead now. pawosm01: using LI->getLoopFor() instead now.
		for (Value *Operand : BO->operands()) {
		if (hasFactor(Operand, Factor))
		return true;
		}
		return false;
		};

		// Only the operands using the factor are being transformed.
		if ((hasFactor(Operand, MaxOccVal)) && (!isInOneLoop(LI, Operand, L)))
		return nullptr; // Transformation not profitable, giving up.
		qcolombetUnsubmitted Not Done Reply Inline Actions TL;DR I think the model should be more general than that but as it is, it is probably a good proxy for not shooting ourselves in the foot. The problem is not pulling something into a loop, the problem is replacing X something with 1 * frequency-of-the-target-basic-block something. I.e., let's imagine we have: v1 = s1 * delta; v2 = s2 * delta; ...; vN = sN * delta; for () { v1 + ... + vN // with loop-dependent stuff } Transforming this into: for () { (s1 + ... + sN) * delta } could actually be beneficial as long as the loop count is smaller than N. Similarly, something like: for () { if (unlikely) v1 + ... + vN } is even more likely to be beneficial since the expected frequency of the target basic block may be smaller than that of the source basic block. qcolombet: TL;DR I think the model should be more general than that but as it is, it is probably a good…
		pawosm01AuthorUnsubmitted Not Done Reply Inline Actions "Transforming this into: [...] Could actually be beneficial as long as the loop count is smaller than N." Yes, I was afraid that with this change I'm cutting off some of the beneficial transformations, and making the logic of this pass more complicated than necessary. Therefore I tend to agree with Florian that this problem could be addressed in LICM instead. In the end, it's not a wrong thing for a transformation pass to undo whatever previous pass(es) did when there is new knowledge available (and here, the new knowledge is that we are in a loop). I'm very close to giving up on this commit and working on extending `hoistArithmetics()` (of LICM) with the ability to spot this code pattern. As I mentioned in the other comment, currently LICM can't figure it out even if it wasn't caused by the Reassociate pass; namely, a simple C code that I specifically crafted to replicate this problem was enough to show that GCC produces a faster executable than LLVM. But there's a problem with LICM too. This `hoistArithmetics()` function and its surroundings are getting more and more complicated already. And I assume any attempt to extend it with the ability to deal with the situation discussed here will create a lot of code bloat. But maybe that's something inevitable. pawosm01: > Transforming this into: Could actually be beneficial as long as the loop count is smaller…
		}
		}
		}

// Create a new instruction that uses the MaxOccVal twice. If we don't do		// Create a new instruction that uses the MaxOccVal twice. If we don't do
// this, we could otherwise run into situations where removing a factor		// this, we could otherwise run into situations where removing a factor
// from an expression will drop a use of maxocc, and this can cause		// from an expression will drop a use of maxocc, and this can cause
// RemoveFactorFromExpression on successive values to behave differently.		// RemoveFactorFromExpression on successive values to behave differently.
Instruction *DummyInst =		Instruction *DummyInst =
I->getType()->isIntOrIntVectorTy()		I->getType()->isIntOrIntVectorTy()
? BinaryOperator::CreateAdd(MaxOccVal, MaxOccVal)		? BinaryOperator::CreateAdd(MaxOccVal, MaxOccVal)
: BinaryOperator::CreateFAdd(MaxOccVal, MaxOccVal);		: BinaryOperator::CreateFAdd(MaxOccVal, MaxOccVal);
▲ Show 20 Lines • Show All 226 Lines • ▼ Show 20 Lines	if (Ops.empty())
return V;		return V;

ValueEntry NewEntry = ValueEntry(getRank(V), V);		ValueEntry NewEntry = ValueEntry(getRank(V), V);
Ops.insert(llvm::lower_bound(Ops, NewEntry), NewEntry);		Ops.insert(llvm::lower_bound(Ops, NewEntry), NewEntry);
return nullptr;		return nullptr;
}		}

Value ReassociatePass::OptimizeExpression(BinaryOperator I,		Value ReassociatePass::OptimizeExpression(BinaryOperator I,
SmallVectorImpl<ValueEntry> &Ops) {		SmallVectorImpl<ValueEntry> &Ops,
		LoopInfo &LI) {
// Now that we have the linearized expression tree, try to optimize it.		// Now that we have the linearized expression tree, try to optimize it.
// Start by folding any constants that we found.		// Start by folding any constants that we found.
const DataLayout &DL = I->getModule()->getDataLayout();		const DataLayout &DL = I->getModule()->getDataLayout();
Constant *Cst = nullptr;		Constant *Cst = nullptr;
unsigned Opcode = I->getOpcode();		unsigned Opcode = I->getOpcode();
while (!Ops.empty()) {		while (!Ops.empty()) {
if (auto *C = dyn_cast<Constant>(Ops.back().Op)) {		if (auto *C = dyn_cast<Constant>(Ops.back().Op)) {
if (!Cst) {		if (!Cst) {
Show All 37 Lines	Value ReassociatePass::OptimizeExpression(BinaryOperator I,

case Instruction::Xor:		case Instruction::Xor:
if (Value *Result = OptimizeXor(I, Ops))		if (Value *Result = OptimizeXor(I, Ops))
return Result;		return Result;
break;		break;

case Instruction::Add:		case Instruction::Add:
case Instruction::FAdd:		case Instruction::FAdd:
if (Value *Result = OptimizeAdd(I, Ops))		if (Value *Result = OptimizeAdd(I, Ops, LI))
return Result;		return Result;
break;		break;

case Instruction::Mul:		case Instruction::Mul:
case Instruction::FMul:		case Instruction::FMul:
if (Value *Result = OptimizeMul(I, Ops))		if (Value *Result = OptimizeMul(I, Ops))
return Result;		return Result;
break;		break;
}		}

if (Ops.size() != NumOps)		if (Ops.size() != NumOps)
return OptimizeExpression(I, Ops);		return OptimizeExpression(I, Ops, LI);
return nullptr;		return nullptr;
}		}

// Remove dead instructions and if any operands are trivially dead add them to		// Remove dead instructions and if any operands are trivially dead add them to
// Insts so they will be removed as well.		// Insts so they will be removed as well.
void ReassociatePass::RecursivelyEraseDeadInsts(Instruction *I,		void ReassociatePass::RecursivelyEraseDeadInsts(Instruction *I,
OrderedSet &Insts) {		OrderedSet &Insts) {
assert(isInstructionTriviallyDead(I) && "Trivially dead instructions only!");		assert(isInstructionTriviallyDead(I) && "Trivially dead instructions only!");
▲ Show 20 Lines • Show All 168 Lines • ▼ Show 20 Lines	Instruction ReassociatePass::canonicalizeNegFPConstants(Instruction I) {
if (match(I, m_FSub(m_Value(X), m_OneUse(m_Instruction(Op)))))		if (match(I, m_FSub(m_Value(X), m_OneUse(m_Instruction(Op)))))
if (Instruction *R = canonicalizeNegFPConstantsForOp(I, Op, X))		if (Instruction *R = canonicalizeNegFPConstantsForOp(I, Op, X))
I = R;		I = R;
return I;		return I;
}		}

/// Inspect and optimize the given instruction. Note that erasing		/// Inspect and optimize the given instruction. Note that erasing
/// instructions is not allowed.		/// instructions is not allowed.
void ReassociatePass::OptimizeInst(Instruction *I) {		void ReassociatePass::OptimizeInst(Instruction *I, LoopInfo &LI) {
// Only consider operations that we understand.		// Only consider operations that we understand.
if (!isa<UnaryOperator>(I) && !isa<BinaryOperator>(I))		if (!isa<UnaryOperator>(I) && !isa<BinaryOperator>(I))
return;		return;

if (I->getOpcode() == Instruction::Shl && isa<ConstantInt>(I->getOperand(1)))		if (I->getOpcode() == Instruction::Shl && isa<ConstantInt>(I->getOperand(1)))
// If an operand of this shift is a reassociable multiply, or if the shift		// If an operand of this shift is a reassociable multiply, or if the shift
// is used by a reassociable multiply or add, turn into a multiply.		// is used by a reassociable multiply or add, turn into a multiply.
if (isReassociableOp(I->getOperand(0), Instruction::Mul) \|\|		if (isReassociableOp(I->getOperand(0), Instruction::Mul) \|\|
▲ Show 20 Lines • Show All 119 Lines • ▼ Show 20 Lines	void ReassociatePass::OptimizeInst(Instruction *I, LoopInfo &LI) {
// until we process the subtract.		// until we process the subtract.
if (BO->hasOneUse() && BO->getOpcode() == Instruction::Add &&		if (BO->hasOneUse() && BO->getOpcode() == Instruction::Add &&
cast<Instruction>(BO->user_back())->getOpcode() == Instruction::Sub)		cast<Instruction>(BO->user_back())->getOpcode() == Instruction::Sub)
return;		return;
if (BO->hasOneUse() && BO->getOpcode() == Instruction::FAdd &&		if (BO->hasOneUse() && BO->getOpcode() == Instruction::FAdd &&
cast<Instruction>(BO->user_back())->getOpcode() == Instruction::FSub)		cast<Instruction>(BO->user_back())->getOpcode() == Instruction::FSub)
return;		return;

ReassociateExpression(BO);		ReassociateExpression(BO, LI);
}		}

void ReassociatePass::ReassociateExpression(BinaryOperator *I) {		void ReassociatePass::ReassociateExpression(BinaryOperator *I, LoopInfo &LI) {
// First, walk the expression tree, linearizing the tree, collecting the		// First, walk the expression tree, linearizing the tree, collecting the
// operand information.		// operand information.
SmallVector<RepeatedValue, 8> Tree;		SmallVector<RepeatedValue, 8> Tree;
MadeChange \|= LinearizeExprTree(I, Tree, RedoInsts);		MadeChange \|= LinearizeExprTree(I, Tree, RedoInsts);
SmallVector<ValueEntry, 8> Ops;		SmallVector<ValueEntry, 8> Ops;
Ops.reserve(Tree.size());		Ops.reserve(Tree.size());
for (const RepeatedValue &E : Tree)		for (const RepeatedValue &E : Tree)
Ops.append(E.second.getZExtValue(), ValueEntry(getRank(E.first), E.first));		Ops.append(E.second.getZExtValue(), ValueEntry(getRank(E.first), E.first));

LLVM_DEBUG(dbgs() << "RAIn:\t"; PrintOps(I, Ops); dbgs() << '\n');		LLVM_DEBUG(dbgs() << "RAIn:\t"; PrintOps(I, Ops); dbgs() << '\n');

// Now that we have linearized the tree to a list and have gathered all of		// Now that we have linearized the tree to a list and have gathered all of
// the operands and their ranks, sort the operands by their rank. Use a		// the operands and their ranks, sort the operands by their rank. Use a
// stable_sort so that values with equal ranks will have their relative		// stable_sort so that values with equal ranks will have their relative
// positions maintained (and so the compiler is deterministic). Note that		// positions maintained (and so the compiler is deterministic). Note that
// this sorts so that the highest ranking values end up at the beginning of		// this sorts so that the highest ranking values end up at the beginning of
// the vector.		// the vector.
llvm::stable_sort(Ops);		llvm::stable_sort(Ops);

// Now that we have the expression tree in a convenient		// Now that we have the expression tree in a convenient
// sorted form, optimize it globally if possible.		// sorted form, optimize it globally if possible.
if (Value *V = OptimizeExpression(I, Ops)) {		if (Value *V = OptimizeExpression(I, Ops, LI)) {
if (V == I)		if (V == I)
// Self-referential expression in unreachable code.		// Self-referential expression in unreachable code.
return;		return;
// This expression tree simplified to something that isn't a tree,		// This expression tree simplified to something that isn't a tree,
// eliminate it.		// eliminate it.
LLVM_DEBUG(dbgs() << "Reassoc to scalar: " << *V << '\n');		LLVM_DEBUG(dbgs() << "Reassoc to scalar: " << *V << '\n');
I->replaceAllUsesWith(V);		I->replaceAllUsesWith(V);
if (Instruction *VI = dyn_cast<Instruction>(V))		if (Instruction *VI = dyn_cast<Instruction>(V))
▲ Show 20 Lines • Show All 147 Lines • ▼ Show 20 Lines	for (Instruction &I : *BI) {
++res.first->second.Score;		++res.first->second.Score;
}		}
}		}
}		}
}		}
}		}
}		}

PreservedAnalyses ReassociatePass::run(Function &F, FunctionAnalysisManager &) {		bool ReassociatePass::runImpl(Function &F, LoopInfo &LI) {
// Get the functions basic blocks in Reverse Post Order. This order is used by		// Get the functions basic blocks in Reverse Post Order. This order is used by
// BuildRankMap to pre calculate ranks correctly. It also excludes dead basic		// BuildRankMap to pre calculate ranks correctly. It also excludes dead basic
// blocks (it has been seen that the analysis in this pass could hang when		// blocks (it has been seen that the analysis in this pass could hang when
// analysing dead basic blocks).		// analysing dead basic blocks).
ReversePostOrderTraversal<Function *> RPOT(&F);		ReversePostOrderTraversal<Function *> RPOT(&F);

// Calculate the rank map for F.		// Calculate the rank map for F.
BuildRankMap(F, RPOT);		BuildRankMap(F, RPOT);
Show All 14 Lines	bool ReassociatePass::runImpl(Function &F, LoopInfo &LI) {
// Traverse the same blocks that were analysed by BuildRankMap.		// Traverse the same blocks that were analysed by BuildRankMap.
for (BasicBlock *BI : RPOT) {		for (BasicBlock *BI : RPOT) {
assert(RankMap.count(&*BI) && "BB should be ranked.");		assert(RankMap.count(&*BI) && "BB should be ranked.");
// Optimize every instruction in the basic block.		// Optimize every instruction in the basic block.
for (BasicBlock::iterator II = BI->begin(), IE = BI->end(); II != IE;)		for (BasicBlock::iterator II = BI->begin(), IE = BI->end(); II != IE;)
if (isInstructionTriviallyDead(&*II)) {		if (isInstructionTriviallyDead(&*II)) {
EraseInst(&*II++);		EraseInst(&*II++);
} else {		} else {
OptimizeInst(&*II);		OptimizeInst(&*II, LI);
assert(II->getParent() == &*BI && "Moved to a different block!");		assert(II->getParent() == &*BI && "Moved to a different block!");
++II;		++II;
}		}

// Make a copy of all the instructions to be redone so we can remove dead		// Make a copy of all the instructions to be redone so we can remove dead
// instructions.		// instructions.
OrderedSet ToRedo(RedoInsts);		OrderedSet ToRedo(RedoInsts);
// Iterate over all instructions to be reevaluated and remove trivially dead		// Iterate over all instructions to be reevaluated and remove trivially dead
Show All 11 Lines	for (BasicBlock *BI : RPOT) {
// Now that we have removed dead instructions, we can reoptimize the		// Now that we have removed dead instructions, we can reoptimize the
// remaining instructions.		// remaining instructions.
while (!RedoInsts.empty()) {		while (!RedoInsts.empty()) {
Instruction *I = RedoInsts.front();		Instruction *I = RedoInsts.front();
RedoInsts.erase(RedoInsts.begin());		RedoInsts.erase(RedoInsts.begin());
if (isInstructionTriviallyDead(I))		if (isInstructionTriviallyDead(I))
EraseInst(I);		EraseInst(I);
else		else
OptimizeInst(I);		OptimizeInst(I, LI);
}		}
}		}

// We are done with the rank map and pair map.		// We are done with the rank map and pair map.
RankMap.clear();		RankMap.clear();
ValueRankMap.clear();		ValueRankMap.clear();
for (auto &Entry : PairMap)		for (auto &Entry : PairMap)
Entry.clear();		Entry.clear();

if (MadeChange) {		return MadeChange;
PreservedAnalyses PA;
PA.preserveSet<CFGAnalyses>();
return PA;
}		}

		PreservedAnalyses ReassociatePass::run(Function &F,
		FunctionAnalysisManager &AM) {
		auto &LI = AM.getResult<LoopAnalysis>(F);

		if (!runImpl(F, LI))
return PreservedAnalyses::all();		return PreservedAnalyses::all();

		PreservedAnalyses PA;
		PA.preserveSet<CFGAnalyses>();
		return PA;
}		}

namespace {		namespace {

class ReassociateLegacyPass : public FunctionPass {		class ReassociateLegacyPass : public FunctionPass {
ReassociatePass Impl;		ReassociatePass Impl;

public:		public:
static char ID; // Pass identification, replacement for typeid		static char ID; // Pass identification, replacement for typeid

ReassociateLegacyPass() : FunctionPass(ID) {		ReassociateLegacyPass() : FunctionPass(ID) {
initializeReassociateLegacyPassPass(*PassRegistry::getPassRegistry());		initializeReassociateLegacyPassPass(*PassRegistry::getPassRegistry());
}		}

bool runOnFunction(Function &F) override {		bool runOnFunction(Function &F) override {
if (skipFunction(F))		if (skipFunction(F))
return false;		return false;
		return Impl.runImpl(F, getAnalysis<LoopInfoWrapperPass>().getLoopInfo());
FunctionAnalysisManager DummyFAM;
auto PA = Impl.run(F, DummyFAM);
return !PA.areAllPreserved();
}		}

void getAnalysisUsage(AnalysisUsage &AU) const override {		void getAnalysisUsage(AnalysisUsage &AU) const override {
AU.setPreservesCFG();		AU.setPreservesCFG();
AU.addPreserved<AAResultsWrapperPass>();		AU.addPreserved<AAResultsWrapperPass>();
AU.addPreserved<BasicAAWrapperPass>();		AU.addPreserved<BasicAAWrapperPass>();
AU.addPreserved<GlobalsAAWrapperPass>();		AU.addPreserved<GlobalsAAWrapperPass>();
		AU.addPreserved<LoopInfoWrapperPass>();
}		}
};		};

} // end anonymous namespace		} // end anonymous namespace

char ReassociateLegacyPass::ID = 0;		char ReassociateLegacyPass::ID = 0;

INITIALIZE_PASS(ReassociateLegacyPass, "reassociate",		INITIALIZE_PASS(ReassociateLegacyPass, "reassociate",
"Reassociate expressions", false, false)		"Reassociate expressions", false, false)

// Public interface to the Reassociate pass		// Public interface to the Reassociate pass
FunctionPass *llvm::createReassociatePass() {		FunctionPass *llvm::createReassociatePass() {
return new ReassociateLegacyPass();		return new ReassociateLegacyPass();
}		}

llvm/test/Other/new-pm-defaults.ll

	Show First 20 Lines • Show All 156 Lines • ▼ Show 20 Lines
	; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass			; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass
	; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-EP-PEEPHOLE-NEXT: Running pass: NoOpFunctionPass			; CHECK-EP-PEEPHOLE-NEXT: Running pass: NoOpFunctionPass
	; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass			; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass
	; CHECK-O-NEXT: Running pass: SimplifyCFGPass			; CHECK-O-NEXT: Running pass: SimplifyCFGPass
	; CHECK-O-NEXT: Running pass: ReassociatePass			; CHECK-O-NEXT: Running pass: ReassociatePass
	; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running analysis: LoopAnalysis			; CHECK-O-NEXT: Running analysis: LoopAnalysis
				; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running pass: LCSSAPass			; CHECK-O-NEXT: Running pass: LCSSAPass
	; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis			; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis
	; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy			; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy
	; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass			; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass
	; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass			; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	; CHECK-O-NEXT: Running pass: LoopRotatePass			; CHECK-O-NEXT: Running pass: LoopRotatePass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	▲ Show 20 Lines • Show All 137 Lines • Show Last 20 Lines

llvm/test/Other/new-pm-thinlto-postlink-defaults.ll

	Show First 20 Lines • Show All 93 Lines • ▼ Show 20 Lines
	; CHECK-O23SZ-NEXT: Running pass: AggressiveInstCombinePass			; CHECK-O23SZ-NEXT: Running pass: AggressiveInstCombinePass
	; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass			; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass
	; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass			; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass
	; CHECK-O-NEXT: Running pass: SimplifyCFGPass			; CHECK-O-NEXT: Running pass: SimplifyCFGPass
	; CHECK-O-NEXT: Running pass: ReassociatePass			; CHECK-O-NEXT: Running pass: ReassociatePass
	; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running analysis: LoopAnalysis			; CHECK-O-NEXT: Running analysis: LoopAnalysis
				; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running pass: LCSSAPass			; CHECK-O-NEXT: Running pass: LCSSAPass
	; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis			; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis
	; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy			; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy
	; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass			; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass
	; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass			; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	; CHECK-O-NEXT: Running pass: LoopRotatePass			; CHECK-O-NEXT: Running pass: LoopRotatePass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	▲ Show 20 Lines • Show All 123 Lines • Show Last 20 Lines

llvm/test/Other/new-pm-thinlto-prelink-defaults.ll

	Show First 20 Lines • Show All 101 Lines • ▼ Show 20 Lines
	; CHECK-O23SZ-NEXT: Running pass: AggressiveInstCombinePass			; CHECK-O23SZ-NEXT: Running pass: AggressiveInstCombinePass
	; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass			; CHECK-O23SZ-NEXT: Running pass: ConstraintEliminationPass
	; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O1-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O2-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass			; CHECK-O3-NEXT: Running pass: LibCallsShrinkWrapPass
	; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass			; CHECK-O23SZ-NEXT: Running pass: TailCallElimPass
	; CHECK-O-NEXT: Running pass: SimplifyCFGPass			; CHECK-O-NEXT: Running pass: SimplifyCFGPass
	; CHECK-O-NEXT: Running pass: ReassociatePass			; CHECK-O-NEXT: Running pass: ReassociatePass
	; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running analysis: LoopAnalysis			; CHECK-O-NEXT: Running analysis: LoopAnalysis
				; CHECK-O-NEXT: Running pass: LoopSimplifyPass
	; CHECK-O-NEXT: Running pass: LCSSAPass			; CHECK-O-NEXT: Running pass: LCSSAPass
	; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis			; CHECK-O-NEXT: Running analysis: ScalarEvolutionAnalysis
	; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy			; CHECK-O-NEXT: Running analysis: InnerAnalysisManagerProxy
	; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass			; CHECK-O-NEXT: Running pass: LoopInstSimplifyPass
	; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass			; CHECK-O-NEXT: Running pass: LoopSimplifyCFGPass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	; CHECK-O-NEXT: Running pass: LoopRotatePass			; CHECK-O-NEXT: Running pass: LoopRotatePass
	; CHECK-O-NEXT: Running pass: LICM			; CHECK-O-NEXT: Running pass: LICM
	▲ Show 20 Lines • Show All 84 Lines • Show Last 20 Lines

llvm/test/Transforms/Reassociate/reassociate-not-from-the-outside-of-the-loop.ll

				; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2
	; RUN: opt -passes=reassociate -S < %s | FileCheck %s			; RUN: opt -passes=reassociate -S < %s | FileCheck %s
				nikicUnsubmitted Done Reply Inline Actions Should use update_test_checks.py. nikic: Should use update_test_checks.py.
				pawosm01AuthorUnsubmitted Not Done Reply Inline Actions It will make it look like this: --- a/llvm/test/Transforms/Reassociate/reassociate-not-from-the-outside-of-the-loop.ll +++ b/llvm/test/Transforms/Reassociate/reassociate-not-from-the-outside-of-the-loop.ll @@ -1,3 +1,4 @@ +; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 2 ; RUN: opt -passes=reassociate -S < %s | FileCheck %s ; This test is to ensure that no computations are pulled into a loop @@ -9,12 +10,35 @@ ; Reassociate pass. define void @innermost_loop(i32 %i, double %d1, double %d2, double %delta, ptr %cells) { -; CHECK-LABEL: @innermost_loop( +; CHECK-LABEL: define void @innermost_loop +; CHECK-SAME: (i32 [[I:%.*]], double [[D1:%.*]], double [[D2:%.*]], double [[DELTA:%.*]], ptr [[CELLS:%.*]]) { +; CHECK-NEXT: entry: +; CHECK-NEXT: [[MUL:%.*]] = fmul fast double [[DELTA]], [[D1]] +; CHECK-NEXT: [[MUL1:%.*]] = fmul fast double [[DELTA]], [[D2]] +; CHECK-NEXT: br label [[FOR_COND:%.*]] +; CHECK: for.cond: +; CHECK-NEXT: [[J_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[ADD:%.*]], [[FOR_BODY:%.*]] ] +; CHECK-NEXT: [[CMP_NOT:%.*]] = icmp sgt i32 [[J_0]], [[I]] +; CHECK-NEXT: br i1 [[CMP_NOT]], label [[FOR_END:%.*]], label [[FOR_BODY]] +; CHECK: for.body: +; CHECK-NEXT: [[ADD]] = add nuw nsw i32 [[J_0]], 1 +; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[ADD]] to i64 +; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, ptr [[CELLS]], i64 [[IDXPROM]] +; CHECK-NEXT: [[TMP0:%.*]] = load double, ptr [[ARRAYIDX]], align 8 +; CHECK-NEXT: [[MUL2:%.*]] = fmul fast double [[MUL]], [[TMP0]] +; CHECK-NEXT: [[IDXPROM3:%.*]] = zext i32 [[J_0]] to i64 +; CHECK-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds double, ptr [[CELLS]], i64 [[IDXPROM3]] +; CHECK-NEXT: [[TMP1:%.*]] = load double, ptr [[ARRAYIDX4]], align 8 +; CHECK-NEXT: [[MUL5:%.*]] = fmul fast double [[MUL1]], [[TMP1]] +; CHECK-NEXT: [[ADD6:%.*]] = fadd fast double [[MUL5]], [[MUL2]] +; CHECK-NEXT: store double [[ADD6]], ptr [[ARRAYIDX4]], align 8 +; CHECK-NEXT: br label [[FOR_COND]] +; CHECK: for.end: +; CHECK-NEXT: ret void +; Is that what is expected here? It doesn't seem to focus on the subject of this patch, and it doesn't seem future-proof: many changes unrelated to this patch could affect this test case in this form... pawosm01:* It will make it look like this: ``` --- a/llvm/test/Transforms/Reassociate/reassociate-not…
				pawosm01AuthorUnsubmitted Done Reply Inline Actions ...and where have those CHECK-NOTs gone? pawosm01: ...and where have those CHECK-NOTs gone?

	; This test is to ensure that no computations are pulled into a loop			; This test is to ensure that no computations are pulled into a loop
	; by the Reassociate pass. Doing so can result in the loop invariants not being			; by the Reassociate pass. Doing so can result in the loop invariants not being
	; computed before the loop anymore. In case of this test, it would add an extra			; computed before the loop anymore. In case of this test, it would add an extra
	; multiplication into the loop.			; multiplication into the loop.

	; FIXME: the checks below need to be inverted to confirm the change to the			; FIXME: the checks below need to be inverted to confirm the change to the
	; Reassociate pass.			; Reassociate pass.

	define void @innermost_loop(i32 %i, double %d1, double %d2, double %delta, ptr %cells) {			define void @innermost_loop(i32 %i, double %d1, double %d2, double %delta, ptr %cells) {
	; CHECK-LABEL: @innermost_loop(			; CHECK-LABEL: define void @innermost_loop
				; CHECK-SAME: (i32 [[I:%.*]], double [[D1:%.*]], double [[D2:%.*]], double [[DELTA:%.*]], ptr [[CELLS:%.*]]) {
				; CHECK-NEXT: entry:
				; CHECK-NEXT: [[MUL:%.*]] = fmul fast double [[DELTA]], [[D1]]
				; CHECK-NEXT: [[MUL1:%.*]] = fmul fast double [[DELTA]], [[D2]]
				; CHECK-NEXT: br label [[FOR_COND:%.*]]
				; CHECK: for.cond:
				; CHECK-NEXT: [[J_0:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[ADD:%.*]], [[FOR_BODY:%.*]] ]
				; CHECK-NEXT: [[CMP_NOT:%.*]] = icmp sgt i32 [[J_0]], [[I]]
				; CHECK-NEXT: br i1 [[CMP_NOT]], label [[FOR_END:%.*]], label [[FOR_BODY]]
				; CHECK: for.body:
				; CHECK-NEXT: [[ADD]] = add nuw nsw i32 [[J_0]], 1
				; CHECK-NEXT: [[IDXPROM:%.*]] = zext i32 [[ADD]] to i64
				; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds double, ptr [[CELLS]], i64 [[IDXPROM]]
				; CHECK-NEXT: [[TMP0:%.*]] = load double, ptr [[ARRAYIDX]], align 8
				; CHECK-NEXT: [[MUL2:%.*]] = fmul fast double [[MUL]], [[TMP0]]
				; CHECK-NEXT: [[IDXPROM3:%.*]] = zext i32 [[J_0]] to i64
				; CHECK-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds double, ptr [[CELLS]], i64 [[IDXPROM3]]
				; CHECK-NEXT: [[TMP1:%.*]] = load double, ptr [[ARRAYIDX4]], align 8
				; CHECK-NEXT: [[MUL5:%.*]] = fmul fast double [[MUL1]], [[TMP1]]
				; CHECK-NEXT: [[ADD6:%.*]] = fadd fast double [[MUL5]], [[MUL2]]
				; CHECK-NEXT: store double [[ADD6]], ptr [[ARRAYIDX4]], align 8
				; CHECK-NEXT: br label [[FOR_COND]]
				; CHECK: for.end:
				; CHECK-NEXT: ret void
				;
	entry:			entry:
	; CHECK-LABEL: entry:
	%mul = fmul fast double %d1, %delta			%mul = fmul fast double %d1, %delta
	%mul1 = fmul fast double %d2, %delta			%mul1 = fmul fast double %d2, %delta
	; CHECK-NOT: %{{.*}} = fmul {{.*}} %delta
	br label %for.cond			br label %for.cond

	for.cond:			for.cond:
	%j.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]			%j.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
	%cmp.not = icmp sgt i32 %j.0, %i			%cmp.not = icmp sgt i32 %j.0, %i
	br i1 %cmp.not, label %for.end, label %for.body			br i1 %cmp.not, label %for.end, label %for.body

	for.body:			for.body:
	; CHECK-LABEL: for.body:
	%add = add nuw nsw i32 %j.0, 1			%add = add nuw nsw i32 %j.0, 1
	%idxprom = zext i32 %add to i64			%idxprom = zext i32 %add to i64
	%arrayidx = getelementptr inbounds double, ptr %cells, i64 %idxprom			%arrayidx = getelementptr inbounds double, ptr %cells, i64 %idxprom
	%0 = load double, ptr %arrayidx			%0 = load double, ptr %arrayidx
	%mul2 = fmul fast double %mul, %0			%mul2 = fmul fast double %mul, %0
	%idxprom3 = zext i32 %j.0 to i64			%idxprom3 = zext i32 %j.0 to i64
	%arrayidx4 = getelementptr inbounds double, ptr %cells, i64 %idxprom3			%arrayidx4 = getelementptr inbounds double, ptr %cells, i64 %idxprom3
	%1 = load double, ptr %arrayidx4			%1 = load double, ptr %arrayidx4
	%mul5 = fmul fast double %mul1, %1			%mul5 = fmul fast double %mul1, %1
	%add6 = fadd fast double %mul2, %mul5			%add6 = fadd fast double %mul2, %mul5
	; CHECK: %reass{{.*}} = fadd
	; CHECK-NEXT: %reass{{.*}} = fmul {{.*}} %delta
	store double %add6, ptr %arrayidx4			store double %add6, ptr %arrayidx4
	br label %for.cond			br label %for.cond

	for.end:			for.end:
	ret void			ret void
	}			}

This is an archive of the discontinued LLVM Phabricator instance.

[Transforms][Reassociate] "Reassociate expressions" pass optimizations not always profitable
AbandonedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 526640

llvm/include/llvm/Transforms/Scalar/Reassociate.h

llvm/lib/Transforms/Scalar/Reassociate.cpp

llvm/test/Other/new-pm-defaults.ll

llvm/test/Other/new-pm-thinlto-postlink-defaults.ll

llvm/test/Other/new-pm-thinlto-prelink-defaults.ll

llvm/test/Transforms/Reassociate/reassociate-not-from-the-outside-of-the-loop.ll

This is an archive of the discontinued LLVM Phabricator instance.

[Transforms][Reassociate] "Reassociate expressions" pass optimizations not always profitableAbandonedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 526640

llvm/include/llvm/Transforms/Scalar/Reassociate.h

llvm/lib/Transforms/Scalar/Reassociate.cpp

llvm/test/Other/new-pm-defaults.ll

llvm/test/Other/new-pm-thinlto-postlink-defaults.ll

llvm/test/Other/new-pm-thinlto-prelink-defaults.ll

llvm/test/Transforms/Reassociate/reassociate-not-from-the-outside-of-the-loop.ll

[Transforms][Reassociate] "Reassociate expressions" pass optimizations not always profitable
AbandonedPublic