Diff 173825

include/llvm/Analysis/VectorUtils.h

Show All 18 Lines
#include "llvm/Analysis/TargetLibraryInfo.h"		#include "llvm/Analysis/TargetLibraryInfo.h"
#include "llvm/IR/IRBuilder.h"		#include "llvm/IR/IRBuilder.h"

namespace llvm {		namespace llvm {

template <typename T> class ArrayRef;		template <typename T> class ArrayRef;
class DemandedBits;		class DemandedBits;
class GetElementPtrInst;		class GetElementPtrInst;
class InterleaveGroup;		template <typename InstTy> class InterleaveGroup;
class Loop;		class Loop;
class ScalarEvolution;		class ScalarEvolution;
class TargetTransformInfo;		class TargetTransformInfo;
class Type;		class Type;
class Value;		class Value;

namespace Intrinsic {		namespace Intrinsic {
enum ID : unsigned;		enum ID : unsigned;
▲ Show 20 Lines • Show All 97 Lines • ▼ Show 20 Lines
/// and \p VF 4, that has only its first member present is:		/// and \p VF 4, that has only its first member present is:
///		///
/// <1,0,0,1,0,0,1,0,0,1,0,0>		/// <1,0,0,1,0,0,1,0,0,1,0,0>
///		///
/// Note: The result is a mask of 0's and 1's, as opposed to the other		/// Note: The result is a mask of 0's and 1's, as opposed to the other
/// create[*]Mask() utilities which create a shuffle mask (mask that		/// create[*]Mask() utilities which create a shuffle mask (mask that
/// consists of indices).		/// consists of indices).
Constant *createBitMaskForGaps(IRBuilder<> &Builder, unsigned VF,		Constant *createBitMaskForGaps(IRBuilder<> &Builder, unsigned VF,
const InterleaveGroup &Group);		const InterleaveGroup<Instruction> &Group);

/// Create a mask with replicated elements.		/// Create a mask with replicated elements.
///		///
/// This function creates a shuffle mask for replicating each of the \p VF		/// This function creates a shuffle mask for replicating each of the \p VF
/// elements in a vector \p ReplicationFactor times. It can be used to		/// elements in a vector \p ReplicationFactor times. It can be used to
/// transform a mask of \p VF elements into a mask of		/// transform a mask of \p VF elements into a mask of
/// \p VF * \p ReplicationFactor elements used by a predicated		/// \p VF * \p ReplicationFactor elements used by a predicated
/// interleaved-group of loads/stores whose Interleaved-factor ==		/// interleaved-group of loads/stores whose Interleaved-factor ==
▲ Show 20 Lines • Show All 78 Lines • ▼ Show 20 Lines
/// A[i] = a; // Member of index 0		/// A[i] = a; // Member of index 0
/// A[i+1] = b; // Member of index 1		/// A[i+1] = b; // Member of index 1
/// A[i+2] = c; // Member of index 2		/// A[i+2] = c; // Member of index 2
/// A[i+3] = d; // Member of index 3		/// A[i+3] = d; // Member of index 3
/// }		/// }
///		///
/// Note: the interleaved load group could have gaps (missing members), but		/// Note: the interleaved load group could have gaps (missing members), but
/// the interleaved store group doesn't allow gaps.		/// the interleaved store group doesn't allow gaps.
class InterleaveGroup {		template <typename InstTy> class InterleaveGroup {
public:		public:
InterleaveGroup(Instruction *Instr, int Stride, unsigned Align)		InterleaveGroup(unsigned Factor, bool Reverse, unsigned Align)
		: Factor(Factor), Reverse(Reverse), Align(Align), InsertPos(nullptr) {}

		InterleaveGroup(InstTy *Instr, int Stride, unsigned Align)
: Align(Align), InsertPos(Instr) {		: Align(Align), InsertPos(Instr) {
assert(Align && "The alignment should be non-zero");		assert(Align && "The alignment should be non-zero");

Factor = std::abs(Stride);		Factor = std::abs(Stride);
assert(Factor > 1 && "Invalid interleave factor");		assert(Factor > 1 && "Invalid interleave factor");

Reverse = Stride < 0;		Reverse = Stride < 0;
Members[0] = Instr;		Members[0] = Instr;
}		}

bool isReverse() const { return Reverse; }		bool isReverse() const { return Reverse; }
unsigned getFactor() const { return Factor; }		unsigned getFactor() const { return Factor; }
unsigned getAlignment() const { return Align; }		unsigned getAlignment() const { return Align; }
unsigned getNumMembers() const { return Members.size(); }		unsigned getNumMembers() const { return Members.size(); }

/// Try to insert a new member \p Instr with index \p Index and		/// Try to insert a new member \p Instr with index \p Index and
/// alignment \p NewAlign. The index is relative to the leader and it can be		/// alignment \p NewAlign. The index is relative to the leader and it can be
/// negative if \p Instr becomes the new leader.		/// negative if \p Instr becomes the new leader.
///		///
/// \returns false if the instruction doesn't belong to the group.		/// \returns false if the instruction doesn't belong to the group.
bool insertMember(Instruction *Instr, int Index, unsigned NewAlign) {		bool insertMember(InstTy *Instr, int Index, unsigned NewAlign) {
assert(NewAlign && "The new member's alignment should be non-zero");		assert(NewAlign && "The new member's alignment should be non-zero");

int Key = Index + SmallestKey;		int Key = Index + SmallestKey;

// Skip if there is already a member with the same index.		// Skip if there is already a member with the same index.
if (Members.find(Key) != Members.end())		if (Members.find(Key) != Members.end())
return false;		return false;

Show All 15 Lines	bool insertMember(InstTy *Instr, int Index, unsigned NewAlign) {
Align = std::min(Align, NewAlign);		Align = std::min(Align, NewAlign);
Members[Key] = Instr;		Members[Key] = Instr;
return true;		return true;
}		}

/// Get the member with the given index \p Index		/// Get the member with the given index \p Index
///		///
/// \returns nullptr if the group contains no such member.		/// \returns nullptr if the group contains no such member.
Instruction *getMember(unsigned Index) const {		InstTy *getMember(unsigned Index) const {
int Key = SmallestKey + Index;		int Key = SmallestKey + Index;
auto Member = Members.find(Key);		auto Member = Members.find(Key);
if (Member == Members.end())		if (Member == Members.end())
return nullptr;		return nullptr;

return Member->second;		return Member->second;
}		}

/// Get the index for the given member. Unlike the key in the member		/// Get the index for the given member. Unlike the key in the member
/// map, the index starts from 0.		/// map, the index starts from 0.
unsigned getIndex(Instruction *Instr) const {		unsigned getIndex(const InstTy *Instr) const {
for (auto I : Members)		for (auto I : Members) {
if (I.second == Instr)		if (I.second == Instr)
return I.first - SmallestKey;		return I.first - SmallestKey;
		}

llvm_unreachable("InterleaveGroup contains no such member");		llvm_unreachable("InterleaveGroup contains no such member");
}		}

Instruction *getInsertPos() const { return InsertPos; }		InstTy *getInsertPos() const { return InsertPos; }
void setInsertPos(Instruction *Inst) { InsertPos = Inst; }		void setInsertPos(InstTy *Inst) { InsertPos = Inst; }

/// Add metadata (e.g. alias info) from the instructions in this group to \p		/// Add metadata (e.g. alias info) from the instructions in this group to \p
/// NewInst.		/// NewInst.
///		///
/// FIXME: this function currently does not add noalias metadata a'la		/// FIXME: this function currently does not add noalias metadata a'la
/// addNewMetadata. To do that we need to compute the intersection of the		/// addNewMetadata. To do that we need to compute the intersection of the
/// noalias info from all members.		/// noalias info from all members.
void addMetadata(Instruction *NewInst) const {		void addMetadata(InstTy *NewInst) const;
SmallVector<Value *, 4> VL;
std::transform(Members.begin(), Members.end(), std::back_inserter(VL),
[](std::pair<int, Instruction *> p) { return p.second; });
propagateMetadata(NewInst, VL);
}

/// Returns true if this Group requires a scalar iteration to handle gaps.		/// Returns true if this Group requires a scalar iteration to handle gaps.
bool requiresScalarEpilogue() const {		bool requiresScalarEpilogue() const {
// If the last member of the Group exists, then a scalar epilog is not		// If the last member of the Group exists, then a scalar epilog is not
// needed for this group.		// needed for this group.
if (getMember(getFactor() - 1))		if (getMember(getFactor() - 1))
return false;		return false;

// We have a group with gaps. It therefore cannot be a group of stores,		// We have a group with gaps. It therefore cannot be a group of stores,
// and it can't be a reversed access, because such groups get invalidated.		// and it can't be a reversed access, because such groups get invalidated.
assert(!getMember(0)->mayWriteToMemory() &&		assert(!getMember(0)->mayWriteToMemory() &&
"Group should have been invalidated");		"Group should have been invalidated");
assert(!isReverse() && "Group should have been invalidated");		assert(!isReverse() && "Group should have been invalidated");

// This is a group of loads, with gaps, and without a last-member		// This is a group of loads, with gaps, and without a last-member
return true;		return true;
}		}

private:		private:
unsigned Factor; // Interleave Factor.		unsigned Factor; // Interleave Factor.
bool Reverse;		bool Reverse;
unsigned Align;		unsigned Align;
DenseMap<int, Instruction *> Members;		DenseMap<int, InstTy *> Members;
int SmallestKey = 0;		int SmallestKey = 0;
int LargestKey = 0;		int LargestKey = 0;

// To avoid breaking dependences, vectorized instructions of an interleave		// To avoid breaking dependences, vectorized instructions of an interleave
// group should be inserted at either the first load or the last store in		// group should be inserted at either the first load or the last store in
// program order.		// program order.
//		//
// E.g. %even = load i32 // Insert Position		// E.g. %even = load i32 // Insert Position
// %add = add i32 %even // Use of %even		// %add = add i32 %even // Use of %even
// %odd = load i32		// %odd = load i32
//		//
// store i32 %even		// store i32 %even
// %odd = add i32 // Def of %odd		// %odd = add i32 // Def of %odd
// store i32 %odd // Insert Position		// store i32 %odd // Insert Position
Instruction *InsertPos;		InstTy *InsertPos;
};		};

/// Drive the analysis of interleaved memory accesses in the loop.		/// Drive the analysis of interleaved memory accesses in the loop.
///		///
/// Use this class to analyze interleaved accesses only when we can vectorize		/// Use this class to analyze interleaved accesses only when we can vectorize
/// a loop. Otherwise it's meaningless to do analysis as the vectorization		/// a loop. Otherwise it's meaningless to do analysis as the vectorization
/// on interleaved accesses is unsafe.		/// on interleaved accesses is unsafe.
///		///
Show All 14 Lines	public:
/// \p EnableMaskedInterleavedGroup is true.		/// \p EnableMaskedInterleavedGroup is true.
void analyzeInterleaving(bool EnableMaskedInterleavedGroup);		void analyzeInterleaving(bool EnableMaskedInterleavedGroup);

/// Invalidate groups, e.g., in case all blocks in loop will be predicated		/// Invalidate groups, e.g., in case all blocks in loop will be predicated
/// contrary to original assumption. Although we currently prevent group		/// contrary to original assumption. Although we currently prevent group
/// formation for predicated accesses, we may be able to relax this limitation		/// formation for predicated accesses, we may be able to relax this limitation
/// in the future once we handle more complicated blocks.		/// in the future once we handle more complicated blocks.
void reset() {		void reset() {
SmallPtrSet<InterleaveGroup *, 4> DelSet;		SmallPtrSet<InterleaveGroup<Instruction> *, 4> DelSet;
// Avoid releasing a pointer twice.		// Avoid releasing a pointer twice.
for (auto &I : InterleaveGroupMap)		for (auto &I : InterleaveGroupMap)
DelSet.insert(I.second);		DelSet.insert(I.second);
for (auto *Ptr : DelSet)		for (auto *Ptr : DelSet)
delete Ptr;		delete Ptr;
InterleaveGroupMap.clear();		InterleaveGroupMap.clear();
RequiresScalarEpilogue = false;		RequiresScalarEpilogue = false;
}		}


/// Check if \p Instr belongs to any interleave group.		/// Check if \p Instr belongs to any interleave group.
bool isInterleaved(Instruction *Instr) const {		bool isInterleaved(Instruction *Instr) const {
return InterleaveGroupMap.find(Instr) != InterleaveGroupMap.end();		return InterleaveGroupMap.find(Instr) != InterleaveGroupMap.end();
}		}

/// Get the interleave group that \p Instr belongs to.		/// Get the interleave group that \p Instr belongs to.
///		///
/// \returns nullptr if \p Instr does not belong to any group.		/// \returns nullptr if \p Instr does not belong to any group.
InterleaveGroup getInterleaveGroup(Instruction Instr) const {		InterleaveGroup<Instruction> *
auto Group = InterleaveGroupMap.find(Instr);		getInterleaveGroup(const Instruction *Instr) const {
if (Group == InterleaveGroupMap.end())		if (InterleaveGroupMap.count(Instr))
		return InterleaveGroupMap.find(Instr)->second;
return nullptr;		return nullptr;
return Group->second;		}

		iterator_range<SmallPtrSetIterator<llvm::InterleaveGroup<Instruction> *>>
		getInterleaveGroups() {
		return make_range(InterleaveGroups.begin(), InterleaveGroups.end());
}		}

/// Returns true if an interleaved group that may access memory		/// Returns true if an interleaved group that may access memory
/// out-of-bounds requires a scalar epilogue iteration for correctness.		/// out-of-bounds requires a scalar epilogue iteration for correctness.
bool requiresScalarEpilogue() const { return RequiresScalarEpilogue; }		bool requiresScalarEpilogue() const { return RequiresScalarEpilogue; }

/// Invalidate groups that require a scalar epilogue (due to gaps). This can		/// Invalidate groups that require a scalar epilogue (due to gaps). This can
/// happen when optimizing for size forbids a scalar epilogue, and the gap		/// happen when optimizing for size forbids a scalar epilogue, and the gap
Show All 13 Lines	private:
const LoopAccessInfo *LAI;		const LoopAccessInfo *LAI;

/// True if the loop may contain non-reversed interleaved groups with		/// True if the loop may contain non-reversed interleaved groups with
/// out-of-bounds accesses. We ensure we don't speculatively access memory		/// out-of-bounds accesses. We ensure we don't speculatively access memory
/// out-of-bounds by executing at least one scalar epilogue iteration.		/// out-of-bounds by executing at least one scalar epilogue iteration.
bool RequiresScalarEpilogue = false;		bool RequiresScalarEpilogue = false;

/// Holds the relationships between the members and the interleave group.		/// Holds the relationships between the members and the interleave group.
DenseMap<Instruction , InterleaveGroup > InterleaveGroupMap;		DenseMap<Instruction , InterleaveGroup<Instruction> > InterleaveGroupMap;

		SmallPtrSet<InterleaveGroup<Instruction> *, 4> InterleaveGroups;

/// Holds dependences among the memory accesses in the loop. It maps a source		/// Holds dependences among the memory accesses in the loop. It maps a source
/// access to a set of dependent sink accesses.		/// access to a set of dependent sink accesses.
DenseMap<Instruction , SmallPtrSet<Instruction , 2>> Dependences;		DenseMap<Instruction , SmallPtrSet<Instruction , 2>> Dependences;

/// The descriptor for a strided memory access.		/// The descriptor for a strided memory access.
struct StrideDescriptor {		struct StrideDescriptor {
StrideDescriptor() = default;		StrideDescriptor() = default;
Show All 16 Lines	private:

/// A type for holding instructions and their stride descriptors.		/// A type for holding instructions and their stride descriptors.
using StrideEntry = std::pair<Instruction *, StrideDescriptor>;		using StrideEntry = std::pair<Instruction *, StrideDescriptor>;

/// Create a new interleave group with the given instruction \p Instr,		/// Create a new interleave group with the given instruction \p Instr,
/// stride \p Stride and alignment \p Align.		/// stride \p Stride and alignment \p Align.
///		///
/// \returns the newly created interleave group.		/// \returns the newly created interleave group.
InterleaveGroup createInterleaveGroup(Instruction Instr, int Stride,		InterleaveGroup<Instruction> *
unsigned Align) {		createInterleaveGroup(Instruction *Instr, int Stride, unsigned Align) {
assert(!isInterleaved(Instr) && "Already in an interleaved access group");		assert(!InterleaveGroupMap.count(Instr) &&
InterleaveGroupMap[Instr] = new InterleaveGroup(Instr, Stride, Align);		"Already in an interleaved access group");
		InterleaveGroupMap[Instr] =
		new InterleaveGroup<Instruction>(Instr, Stride, Align);
		InterleaveGroups.insert(InterleaveGroupMap[Instr]);
return InterleaveGroupMap[Instr];		return InterleaveGroupMap[Instr];
}		}

/// Release the group and remove all the relationships.		/// Release the group and remove all the relationships.
void releaseGroup(InterleaveGroup *Group) {		void releaseGroup(InterleaveGroup<Instruction> *Group) {
for (unsigned i = 0; i < Group->getFactor(); i++)		for (unsigned i = 0; i < Group->getFactor(); i++)
if (Instruction *Member = Group->getMember(i))		if (Instruction *Member = Group->getMember(i))
InterleaveGroupMap.erase(Member);		InterleaveGroupMap.erase(Member);

		InterleaveGroups.erase(Group);
delete Group;		delete Group;
}		}

/// Collect all the accesses with a constant stride in program order.		/// Collect all the accesses with a constant stride in program order.
void collectConstStrideAccesses(		void collectConstStrideAccesses(
MapVector<Instruction *, StrideDescriptor> &AccessStrideInfo,		MapVector<Instruction *, StrideDescriptor> &AccessStrideInfo,
const ValueToValueMap &Strides);		const ValueToValueMap &Strides);

▲ Show 20 Lines • Show All 78 Lines • Show Last 20 Lines

lib/Analysis/VectorUtils.cpp

Show First 20 Lines • Show All 499 Lines • ▼ Show 20 Lines	for (auto Kind :
}		}

Inst->setMetadata(Kind, MD);		Inst->setMetadata(Kind, MD);
}		}

return Inst;		return Inst;
}		}

Constant *llvm::createBitMaskForGaps(IRBuilder<> &Builder, unsigned VF,		Constant *
const InterleaveGroup &Group) {		llvm::createBitMaskForGaps(IRBuilder<> &Builder, unsigned VF,
		const InterleaveGroup<Instruction> &Group) {
// All 1's means mask is not needed.		// All 1's means mask is not needed.
if (Group.getNumMembers() == Group.getFactor())		if (Group.getNumMembers() == Group.getFactor())
return nullptr;		return nullptr;

// TODO: support reversed access.		// TODO: support reversed access.
assert(!Group.isReverse() && "Reversed group not supported.");		assert(!Group.isReverse() && "Reversed group not supported.");

SmallVector<Constant *, 16> Mask;		SmallVector<Constant *, 16> Mask;
▲ Show 20 Lines • Show All 197 Lines • ▼ Show 20 Lines	void InterleavedAccessInfo::analyzeInterleaving(

if (AccessStrideInfo.empty())		if (AccessStrideInfo.empty())
return;		return;

// Collect the dependences in the loop.		// Collect the dependences in the loop.
collectDependences();		collectDependences();

// Holds all interleaved store groups temporarily.		// Holds all interleaved store groups temporarily.
SmallSetVector<InterleaveGroup *, 4> StoreGroups;		SmallSetVector<InterleaveGroup<Instruction> *, 4> StoreGroups;
// Holds all interleaved load groups temporarily.		// Holds all interleaved load groups temporarily.
SmallSetVector<InterleaveGroup *, 4> LoadGroups;		SmallSetVector<InterleaveGroup<Instruction> *, 4> LoadGroups;

// Search in bottom-up program order for pairs of accesses (A and B) that can		// Search in bottom-up program order for pairs of accesses (A and B) that can
// form interleaved load or store groups. In the algorithm below, access A		// form interleaved load or store groups. In the algorithm below, access A
// precedes access B in program order. We initialize a group for B in the		// precedes access B in program order. We initialize a group for B in the
// outer loop of the algorithm, and then in the inner loop, we attempt to		// outer loop of the algorithm, and then in the inner loop, we attempt to
// insert each A into B's group if:		// insert each A into B's group if:
//		//
// 1. A and B have the same stride,		// 1. A and B have the same stride,
// 2. A and B have the same memory object size, and		// 2. A and B have the same memory object size, and
// 3. A belongs in B's group according to its distance from B.		// 3. A belongs in B's group according to its distance from B.
//		//
// Special care is taken to ensure group formation will not break any		// Special care is taken to ensure group formation will not break any
// dependences.		// dependences.
for (auto BI = AccessStrideInfo.rbegin(), E = AccessStrideInfo.rend();		for (auto BI = AccessStrideInfo.rbegin(), E = AccessStrideInfo.rend();
BI != E; ++BI) {		BI != E; ++BI) {
Instruction *B = BI->first;		Instruction *B = BI->first;
StrideDescriptor DesB = BI->second;		StrideDescriptor DesB = BI->second;

// Initialize a group for B if it has an allowable stride. Even if we don't		// Initialize a group for B if it has an allowable stride. Even if we don't
// create a group for B, we continue with the bottom-up algorithm to ensure		// create a group for B, we continue with the bottom-up algorithm to ensure
// we don't break any of B's dependences.		// we don't break any of B's dependences.
InterleaveGroup *Group = nullptr;		InterleaveGroup<Instruction> *Group = nullptr;
if (isStrided(DesB.Stride) &&		if (isStrided(DesB.Stride) &&
(!isPredicated(B->getParent()) \|\| EnablePredicatedInterleavedMemAccesses)) {		(!isPredicated(B->getParent()) \|\| EnablePredicatedInterleavedMemAccesses)) {
Group = getInterleaveGroup(B);		Group = getInterleaveGroup(B);
if (!Group) {		if (!Group) {
LLVM_DEBUG(dbgs() << "LV: Creating an interleave group with:" << *B		LLVM_DEBUG(dbgs() << "LV: Creating an interleave group with:" << *B
<< '\n');		<< '\n');
Group = createInterleaveGroup(B, DesB.Stride, DesB.Align);		Group = createInterleaveGroup(B, DesB.Stride, DesB.Align);
}		}
Show All 28 Lines	for (auto AI = std::next(BI); AI != E; ++AI) {
// the boundaries of the (2, 4) group.		// the boundaries of the (2, 4) group.
if (!canReorderMemAccessesForInterleavedGroups(&AI, &BI)) {		if (!canReorderMemAccessesForInterleavedGroups(&AI, &BI)) {
// If a dependence exists and A is already in a group, we know that A		// If a dependence exists and A is already in a group, we know that A
// must be a store since A precedes B and WAR dependences are allowed.		// must be a store since A precedes B and WAR dependences are allowed.
// Thus, A would be sunk below B. We release A's group to prevent this		// Thus, A would be sunk below B. We release A's group to prevent this
// illegal code motion. A will then be free to form another group with		// illegal code motion. A will then be free to form another group with
// instructions that precede it.		// instructions that precede it.
if (isInterleaved(A)) {		if (isInterleaved(A)) {
InterleaveGroup *StoreGroup = getInterleaveGroup(A);		InterleaveGroup<Instruction> *StoreGroup = getInterleaveGroup(A);
StoreGroups.remove(StoreGroup);		StoreGroups.remove(StoreGroup);
releaseGroup(StoreGroup);		releaseGroup(StoreGroup);
}		}

// If a dependence exists and A is not already in a group (or it was		// If a dependence exists and A is not already in a group (or it was
// and we just released it), B might be hoisted above A (if B is a		// and we just released it), B might be hoisted above A (if B is a
// load) or another store might be sunk below A (if B is a store). In		// load) or another store might be sunk below A (if B is a store). In
// either case, we can't add additional instructions to B's group. B		// either case, we can't add additional instructions to B's group. B
▲ Show 20 Lines • Show All 62 Lines • ▼ Show 20 Lines	for (auto AI = std::next(BI); AI != E; ++AI) {
// Set the first load in program order as the insert position.		// Set the first load in program order as the insert position.
if (A->mayReadFromMemory())		if (A->mayReadFromMemory())
Group->setInsertPos(A);		Group->setInsertPos(A);
}		}
} // Iteration over A accesses.		} // Iteration over A accesses.
} // Iteration over B accesses.		} // Iteration over B accesses.

// Remove interleaved store groups with gaps.		// Remove interleaved store groups with gaps.
for (InterleaveGroup *Group : StoreGroups)		for (auto *Group : StoreGroups)
if (Group->getNumMembers() != Group->getFactor()) {		if (Group->getNumMembers() != Group->getFactor()) {
LLVM_DEBUG(		LLVM_DEBUG(
dbgs() << "LV: Invalidate candidate interleaved store group due "		dbgs() << "LV: Invalidate candidate interleaved store group due "
"to gaps.\n");		"to gaps.\n");
releaseGroup(Group);		releaseGroup(Group);
}		}
// Remove interleaved groups with gaps (currently only loads) whose memory		// Remove interleaved groups with gaps (currently only loads) whose memory
// accesses may wrap around. We have to revisit the getPtrStride analysis,		// accesses may wrap around. We have to revisit the getPtrStride analysis,
// this time with ShouldCheckWrap=true, since collectConstStrideAccesses does		// this time with ShouldCheckWrap=true, since collectConstStrideAccesses does
// not check wrapping (see documentation there).		// not check wrapping (see documentation there).
// FORNOW we use Assume=false;		// FORNOW we use Assume=false;
// TODO: Change to Assume=true but making sure we don't exceed the threshold		// TODO: Change to Assume=true but making sure we don't exceed the threshold
// of runtime SCEV assumptions checks (thereby potentially failing to		// of runtime SCEV assumptions checks (thereby potentially failing to
// vectorize altogether).		// vectorize altogether).
// Additional optional optimizations:		// Additional optional optimizations:
// TODO: If we are peeling the loop and we know that the first pointer doesn't		// TODO: If we are peeling the loop and we know that the first pointer doesn't
// wrap then we can deduce that all pointers in the group don't wrap.		// wrap then we can deduce that all pointers in the group don't wrap.
// This means that we can forcefully peel the loop in order to only have to		// This means that we can forcefully peel the loop in order to only have to
// check the first pointer for no-wrap. When we'll change to use Assume=true		// check the first pointer for no-wrap. When we'll change to use Assume=true
// we'll only need at most one runtime check per interleaved group.		// we'll only need at most one runtime check per interleaved group.
for (InterleaveGroup *Group : LoadGroups) {		for (auto *Group : LoadGroups) {
// Case 1: A full group. Can Skip the checks; For full groups, if the wide		// Case 1: A full group. Can Skip the checks; For full groups, if the wide
// load would wrap around the address space we would do a memory access at		// load would wrap around the address space we would do a memory access at
// nullptr even without the transformation.		// nullptr even without the transformation.
if (Group->getNumMembers() == Group->getFactor())		if (Group->getNumMembers() == Group->getFactor())
continue;		continue;

// Case 2: If first and last members of the group don't wrap this implies		// Case 2: If first and last members of the group don't wrap this implies
// that all the pointers in the group don't wrap.		// that all the pointers in the group don't wrap.
▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines

void InterleavedAccessInfo::invalidateGroupsRequiringScalarEpilogue() {		void InterleavedAccessInfo::invalidateGroupsRequiringScalarEpilogue() {
// If no group had triggered the requirement to create an epilogue loop,		// If no group had triggered the requirement to create an epilogue loop,
// there is nothing to do.		// there is nothing to do.
if (!requiresScalarEpilogue())		if (!requiresScalarEpilogue())
return;		return;

// Avoid releasing a Group twice.		// Avoid releasing a Group twice.
SmallPtrSet<InterleaveGroup *, 4> DelSet;		SmallPtrSet<InterleaveGroup<Instruction> *, 4> DelSet;
for (auto &I : InterleaveGroupMap) {		for (auto &I : InterleaveGroupMap) {
InterleaveGroup *Group = I.second;		InterleaveGroup<Instruction> *Group = I.second;
if (Group->requiresScalarEpilogue())		if (Group->requiresScalarEpilogue())
DelSet.insert(Group);		DelSet.insert(Group);
}		}
for (auto *Ptr : DelSet) {		for (auto *Ptr : DelSet) {
LLVM_DEBUG(		LLVM_DEBUG(
dbgs()		dbgs()
<< "LV: Invalidate candidate interleaved group due to gaps that "		<< "LV: Invalidate candidate interleaved group due to gaps that "
"require a scalar epilogue (not allowed under optsize) and cannot "		"require a scalar epilogue (not allowed under optsize) and cannot "
"be masked (not enabled). \n");		"be masked (not enabled). \n");
releaseGroup(Ptr);		releaseGroup(Ptr);
}		}

RequiresScalarEpilogue = false;		RequiresScalarEpilogue = false;
}		}

		template <>
		void InterleaveGroup<Instruction>::addMetadata(Instruction *NewInst) const {
		SmallVector<Value *, 4> VL;
		std::transform(Members.begin(), Members.end(), std::back_inserter(VL),
		[](std::pair<int, Instruction *> p) { return p.second; });
		propagateMetadata(NewInst, VL);
		}

		template <typename InstT>
		void InterleaveGroup<InstT>::addMetadata(InstT *NewInst) const {
		llvm_unreachable("addMetadata can only be used for Instruction");
		}

lib/Transforms/Vectorize/LoopVectorize.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 970 Lines • ▼ Show 20 Lines	public:
void setWideningDecision(Instruction *I, unsigned VF, InstWidening W,		void setWideningDecision(Instruction *I, unsigned VF, InstWidening W,
unsigned Cost) {		unsigned Cost) {
assert(VF >= 2 && "Expected VF >=2");		assert(VF >= 2 && "Expected VF >=2");
WideningDecisions[std::make_pair(I, VF)] = std::make_pair(W, Cost);		WideningDecisions[std::make_pair(I, VF)] = std::make_pair(W, Cost);
}		}

/// Save vectorization decision \p W and \p Cost taken by the cost model for		/// Save vectorization decision \p W and \p Cost taken by the cost model for
/// interleaving group \p Grp and vector width \p VF.		/// interleaving group \p Grp and vector width \p VF.
void setWideningDecision(const InterleaveGroup *Grp, unsigned VF,		void setWideningDecision(const InterleaveGroup<Instruction> *Grp, unsigned VF,
InstWidening W, unsigned Cost) {		InstWidening W, unsigned Cost) {
assert(VF >= 2 && "Expected VF >=2");		assert(VF >= 2 && "Expected VF >=2");
/// Broadcast this decision to all instructions inside the group.		/// Broadcast this decision to all instructions inside the group.
/// But the cost will be assigned to one instruction only.		/// But the cost will be assigned to one instruction only.
for (unsigned i = 0; i < Grp->getFactor(); ++i) {		for (unsigned i = 0; i < Grp->getFactor(); ++i) {
if (auto *I = Grp->getMember(i)) {		if (auto *I = Grp->getMember(i)) {
if (Grp->getInsertPos() == I)		if (Grp->getInsertPos() == I)
WideningDecisions[std::make_pair(I, VF)] = std::make_pair(W, Cost);		WideningDecisions[std::make_pair(I, VF)] = std::make_pair(W, Cost);
▲ Show 20 Lines • Show All 138 Lines • ▼ Show 20 Lines	public:
bool interleavedAccessCanBeWidened(Instruction *I, unsigned VF = 1);		bool interleavedAccessCanBeWidened(Instruction *I, unsigned VF = 1);

/// Check if \p Instr belongs to any interleaved access group.		/// Check if \p Instr belongs to any interleaved access group.
bool isAccessInterleaved(Instruction *Instr) {		bool isAccessInterleaved(Instruction *Instr) {
return InterleaveInfo.isInterleaved(Instr);		return InterleaveInfo.isInterleaved(Instr);
}		}

/// Get the interleaved access group that \p Instr belongs to.		/// Get the interleaved access group that \p Instr belongs to.
const InterleaveGroup getInterleavedAccessGroup(Instruction Instr) {		const InterleaveGroup<Instruction> *
		getInterleavedAccessGroup(Instruction *Instr) {
return InterleaveInfo.getInterleaveGroup(Instr);		return InterleaveInfo.getInterleaveGroup(Instr);
}		}

/// Returns true if an interleaved group requires a scalar iteration		/// Returns true if an interleaved group requires a scalar iteration
/// to handle accesses with gaps, and there is nothing preventing us from		/// to handle accesses with gaps, and there is nothing preventing us from
/// creating a scalar epilogue.		/// creating a scalar epilogue.
bool requiresScalarEpilogue() const {		bool requiresScalarEpilogue() const {
return IsScalarEpilogueAllowed && InterleaveInfo.requiresScalarEpilogue();		return IsScalarEpilogueAllowed && InterleaveInfo.requiresScalarEpilogue();
▲ Show 20 Lines • Show All 846 Lines • ▼ Show 20 Lines
// To:		// To:
// %R_G.vec = shuffle %R.vec, %G.vec, <0, 1, 2, ..., 7>		// %R_G.vec = shuffle %R.vec, %G.vec, <0, 1, 2, ..., 7>
// %B_U.vec = shuffle %B.vec, undef, <0, 1, 2, 3, u, u, u, u>		// %B_U.vec = shuffle %B.vec, undef, <0, 1, 2, 3, u, u, u, u>
// %interleaved.vec = shuffle %R_G.vec, %B_U.vec,		// %interleaved.vec = shuffle %R_G.vec, %B_U.vec,
// <0, 4, 8, 1, 5, 9, 2, 6, 10, 3, 7, 11> ; Interleave R,G,B elements		// <0, 4, 8, 1, 5, 9, 2, 6, 10, 3, 7, 11> ; Interleave R,G,B elements
// store <12 x i32> %interleaved.vec ; Write 4 tuples of R,G,B		// store <12 x i32> %interleaved.vec ; Write 4 tuples of R,G,B
void InnerLoopVectorizer::vectorizeInterleaveGroup(Instruction *Instr,		void InnerLoopVectorizer::vectorizeInterleaveGroup(Instruction *Instr,
VectorParts *BlockInMask) {		VectorParts *BlockInMask) {
const InterleaveGroup *Group = Cost->getInterleavedAccessGroup(Instr);		const InterleaveGroup<Instruction> *Group =
		Cost->getInterleavedAccessGroup(Instr);
assert(Group && "Fail to get an interleaved access group.");		assert(Group && "Fail to get an interleaved access group.");

// Skip if current instruction is not the insert position.		// Skip if current instruction is not the insert position.
if (Instr != Group->getInsertPos())		if (Instr != Group->getInsertPos())
return;		return;

const DataLayout &DL = Instr->getModule()->getDataLayout();		const DataLayout &DL = Instr->getModule()->getDataLayout();
Value *Ptr = getLoadStorePointerOperand(Instr);		Value *Ptr = getLoadStorePointerOperand(Instr);
▲ Show 20 Lines • Show All 4,366 Lines • ▼ Show 20 Lines	VPValue VPRecipeBuilder::createBlockInMask(BasicBlock BB, VPlanPtr &Plan) {
}		}

return BlockMaskCache[BB] = BlockMask;		return BlockMaskCache[BB] = BlockMask;
}		}

VPInterleaveRecipe VPRecipeBuilder::tryToInterleaveMemory(Instruction I,		VPInterleaveRecipe VPRecipeBuilder::tryToInterleaveMemory(Instruction I,
VFRange &Range,		VFRange &Range,
VPlanPtr &Plan) {		VPlanPtr &Plan) {
const InterleaveGroup *IG = CM.getInterleavedAccessGroup(I);		const InterleaveGroup<Instruction> *IG = CM.getInterleavedAccessGroup(I);
if (!IG)		if (!IG)
return nullptr;		return nullptr;

// Now check if IG is relevant for VF's in the given range.		// Now check if IG is relevant for VF's in the given range.
auto isIGMember = [&](Instruction *I) -> std::function<bool(unsigned)> {		auto isIGMember = [&](Instruction *I) -> std::function<bool(unsigned)> {
return [=](unsigned VF) -> bool {		return [=](unsigned VF) -> bool {
return (VF >= 2 && // Query is illegal for VF == 1		return (VF >= 2 && // Query is illegal for VF == 1
CM.getWideningDecision(I, VF) ==		CM.getWideningDecision(I, VF) ==
▲ Show 20 Lines • Show All 399 Lines • ▼ Show 20 Lines	for (Instruction &I : BB->instructionsWithoutDebug()) {
// First filter out irrelevant instructions, to ensure no recipes are		// First filter out irrelevant instructions, to ensure no recipes are
// built for them.		// built for them.
if (isa<BranchInst>(Instr) \|\|		if (isa<BranchInst>(Instr) \|\|
DeadInstructions.find(Instr) != DeadInstructions.end())		DeadInstructions.find(Instr) != DeadInstructions.end())
continue;		continue;

// I is a member of an InterleaveGroup for Range.Start. If it's an adjunct		// I is a member of an InterleaveGroup for Range.Start. If it's an adjunct
// member of the IG, do not construct any Recipe for it.		// member of the IG, do not construct any Recipe for it.
const InterleaveGroup *IG = CM.getInterleavedAccessGroup(Instr);		const InterleaveGroup<Instruction> *IG =
		CM.getInterleavedAccessGroup(Instr);
if (IG && Instr != IG->getInsertPos() &&		if (IG && Instr != IG->getInsertPos() &&
Range.Start >= 2 && // Query is illegal for VF == 1		Range.Start >= 2 && // Query is illegal for VF == 1
CM.getWideningDecision(Instr, Range.Start) ==		CM.getWideningDecision(Instr, Range.Start) ==
LoopVectorizationCostModel::CM_Interleave) {		LoopVectorizationCostModel::CM_Interleave) {
auto SinkCandidate = SinkAfterInverse.find(Instr);		auto SinkCandidate = SinkAfterInverse.find(Instr);
if (SinkCandidate != SinkAfterInverse.end())		if (SinkCandidate != SinkAfterInverse.end())
Ingredients.push_back(SinkCandidate->second);		Ingredients.push_back(SinkCandidate->second);
continue;		continue;
▲ Show 20 Lines • Show All 724 Lines • Show Last 20 Lines

lib/Transforms/Vectorize/VPlan.h

Show All 32 Lines
#include "llvm/ADT/GraphTraits.h"		#include "llvm/ADT/GraphTraits.h"
#include "llvm/ADT/Optional.h"		#include "llvm/ADT/Optional.h"
#include "llvm/ADT/SmallPtrSet.h"		#include "llvm/ADT/SmallPtrSet.h"
#include "llvm/ADT/SmallSet.h"		#include "llvm/ADT/SmallSet.h"
#include "llvm/ADT/SmallVector.h"		#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/Twine.h"		#include "llvm/ADT/Twine.h"
#include "llvm/ADT/ilist.h"		#include "llvm/ADT/ilist.h"
#include "llvm/ADT/ilist_node.h"		#include "llvm/ADT/ilist_node.h"
		#include "llvm/Analysis/VectorUtils.h"
#include "llvm/IR/IRBuilder.h"		#include "llvm/IR/IRBuilder.h"
#include <algorithm>		#include <algorithm>
#include <cassert>		#include <cassert>
#include <cstddef>		#include <cstddef>
#include <map>		#include <map>
#include <string>		#include <string>

namespace llvm {		namespace llvm {

class LoopVectorizationLegality;		class LoopVectorizationLegality;
class LoopVectorizationCostModel;		class LoopVectorizationCostModel;
class BasicBlock;		class BasicBlock;
class DominatorTree;		class DominatorTree;
class InnerLoopVectorizer;		class InnerLoopVectorizer;
class InterleaveGroup;		template <class T> class InterleaveGroup;
		class LoopInfo;
class raw_ostream;		class raw_ostream;
class Value;		class Value;
class VPBasicBlock;		class VPBasicBlock;
class VPRegionBlock;		class VPRegionBlock;
class VPlan;		class VPlan;

/// A range of powers-of-2 vectorization factors with fixed start and		/// A range of powers-of-2 vectorization factors with fixed start and
/// adjustable end. The range includes start and excludes end, e.g.,:		/// adjustable end. The range includes start and excludes end, e.g.,:
▲ Show 20 Lines • Show All 702 Lines • ▼ Show 20 Lines	public:
/// Print the recipe.		/// Print the recipe.
void print(raw_ostream &O, const Twine &Indent) const override;		void print(raw_ostream &O, const Twine &Indent) const override;
};		};

/// VPInterleaveRecipe is a recipe for transforming an interleave group of load		/// VPInterleaveRecipe is a recipe for transforming an interleave group of load
/// or stores into one wide load/store and shuffles.		/// or stores into one wide load/store and shuffles.
class VPInterleaveRecipe : public VPRecipeBase {		class VPInterleaveRecipe : public VPRecipeBase {
private:		private:
const InterleaveGroup *IG;		const InterleaveGroup<Instruction> *IG;
std::unique_ptr<VPUser> User;		std::unique_ptr<VPUser> User;

public:		public:
VPInterleaveRecipe(const InterleaveGroup IG, VPValue Mask)		VPInterleaveRecipe(const InterleaveGroup<Instruction> IG, VPValue Mask)
: VPRecipeBase(VPInterleaveSC), IG(IG) {		: VPRecipeBase(VPInterleaveSC), IG(IG) {
if (Mask) // Create a VPInstruction to register as a user of the mask.		if (Mask) // Create a VPInstruction to register as a user of the mask.
User.reset(new VPUser({Mask}));		User.reset(new VPUser({Mask}));
}		}
~VPInterleaveRecipe() override = default;		~VPInterleaveRecipe() override = default;

/// Method to support type inquiry through isa, cast, and dyn_cast.		/// Method to support type inquiry through isa, cast, and dyn_cast.
static inline bool classof(const VPRecipeBase *V) {		static inline bool classof(const VPRecipeBase *V) {
return V->getVPRecipeID() == VPRecipeBase::VPInterleaveSC;		return V->getVPRecipeID() == VPRecipeBase::VPInterleaveSC;
}		}

/// Generate the wide load or store, and shuffles.		/// Generate the wide load or store, and shuffles.
void execute(VPTransformState &State) override;		void execute(VPTransformState &State) override;

/// Print the recipe.		/// Print the recipe.
void print(raw_ostream &O, const Twine &Indent) const override;		void print(raw_ostream &O, const Twine &Indent) const override;

const InterleaveGroup *getInterleaveGroup() { return IG; }		const InterleaveGroup<Instruction> *getInterleaveGroup() { return IG; }
};		};

/// VPReplicateRecipe replicates a given instruction producing multiple scalar		/// VPReplicateRecipe replicates a given instruction producing multiple scalar
/// copies of the original scalar type, one per lane, instead of producing a		/// copies of the original scalar type, one per lane, instead of producing a
/// single copy of widened type for all lanes. If the instruction is known to be		/// single copy of widened type for all lanes. If the instruction is known to be
/// uniform only one copy, per lane zero, will be generated.		/// uniform only one copy, per lane zero, will be generated.
class VPReplicateRecipe : public VPRecipeBase {		class VPReplicateRecipe : public VPRecipeBase {
private:		private:
▲ Show 20 Lines • Show All 653 Lines • ▼ Show 20 Lines	public:
/// Disconnect VPBlockBases \p From and \p To bi-directionally. Remove \p To		/// Disconnect VPBlockBases \p From and \p To bi-directionally. Remove \p To
/// from the successors of \p From and \p From from the predecessors of \p To.		/// from the successors of \p From and \p From from the predecessors of \p To.
static void disconnectBlocks(VPBlockBase From, VPBlockBase To) {		static void disconnectBlocks(VPBlockBase From, VPBlockBase To) {
assert(To && "Successor to disconnect is null.");		assert(To && "Successor to disconnect is null.");
From->removeSuccessor(To);		From->removeSuccessor(To);
To->removePredecessor(From);		To->removePredecessor(From);
}		}
};		};

		/// Maps each VPInstruction to the InterleaveGroup<VPInstruction> it is a
		/// member of.
		///
		/// The groups are allocated with `new` by the constructor and released by
		/// the destructor, so this object owns them. Several map entries may refer
		/// to the same group (one entry per member instruction).
		class VPInterleavedAccessInfo {
		private:
		  /// Member instruction -> interleave group containing it. Both key and
		  /// value are pointers: the destructor deletes the mapped values and
		  /// getInterleaveGroup() hands them out as pointers.
		  DenseMap<VPInstruction *, InterleaveGroup<VPInstruction> *>
		      InterleaveGroupMap;

		public:
		  /// Populate the map for the instructions of \p Plan, using the interleave
		  /// groups recorded in \p IAI.
		  VPInterleavedAccessInfo(VPlan &Plan, InterleavedAccessInfo &IAI);

		  // The destructor frees the groups through raw pointers; a copied object
		  // would free the same groups a second time, so copying is disabled.
		  VPInterleavedAccessInfo(const VPInterleavedAccessInfo &) = delete;
		  VPInterleavedAccessInfo &operator=(const VPInterleavedAccessInfo &) = delete;

		  ~VPInterleavedAccessInfo() {
		    // All members of a group map to the same pointer. Collect the distinct
		    // pointers first to avoid releasing a pointer twice.
		    SmallPtrSet<InterleaveGroup<VPInstruction> *, 4> DelSet;
		    for (const auto &Entry : InterleaveGroupMap)
		      DelSet.insert(Entry.second);
		    for (auto *Ptr : DelSet)
		      delete Ptr;
		  }

		  /// Get the interleave group that \p Instr belongs to.
		  ///
		  /// \returns nullptr if doesn't have such group.
		  InterleaveGroup<VPInstruction> *
		  getInterleaveGroup(VPInstruction *Instr) const {
		    // lookup() returns a value-initialized (null) pointer for a missing key,
		    // so a single hash probe covers both the hit and the miss case.
		    return InterleaveGroupMap.lookup(Instr);
		  }
		};

		dcaballeUnsubmitted Not Done Reply Inline Actions Just curious. How difficult would it be to templatize the IAI methods needed here? dcaballe: Just curious. How difficult would it be to templatize the IAI methods needed here?
		fhahnAuthorUnsubmitted Not Done Reply Inline Actions I am not entirely sure, but most of the regular IAI is related to building the interleave groups, which is not required here because we are re-using the regular one. fhahn: I am not entirely sure, but most of the regular IAI is related to building the interleave…
} // end namespace llvm		} // end namespace llvm

#endif // LLVM_TRANSFORMS_VECTORIZE_VPLAN_H		#endif // LLVM_TRANSFORMS_VECTORIZE_VPLAN_H

lib/Transforms/Vectorize/VPlan.cpp

Show First 20 Lines • Show All 674 Lines • ▼ Show 20 Lines	void VPWidenMemoryInstructionRecipe::print(raw_ostream &O,
if (User) {		if (User) {
O << ", ";		O << ", ";
User->getOperand(0)->printAsOperand(O);		User->getOperand(0)->printAsOperand(O);
}		}
O << "\\l\"";		O << "\\l\"";
}		}

template void DomTreeBuilder::Calculate<VPDominatorTree>(VPDominatorTree &DT);		template void DomTreeBuilder::Calculate<VPDominatorTree>(VPDominatorTree &DT);

		VPInterleavedAccessInfo::VPInterleavedAccessInfo(VPlan &Plan,
		InterleavedAccessInfo &IAI) {
		DenseMap<InterleaveGroup<Instruction> , InterleaveGroup<VPInstruction> >
		dcaballeUnsubmitted Done Reply Inline Actions This algorithm assumes that there is only a region (top region) in the whole H-CFG but this is going to change pretty soon. Could you please change the implementation to recursively go inside other potential nested regions? dcaballe: This algorithm assumes that there is only a region (top region) in the whole H-CFG but this is…
		fhahnAuthorUnsubmitted Not Done Reply Inline Actions Will do. I just have to think a bit more how everything will fit together with outerloops, as the regular InterleavedAccessInfo only works on a single loop. fhahn: Will do. I just have to think a bit more how everything will fit together with outerloops, as…
		Old2New;

		auto *TopRegion = cast<VPRegionBlock>(Plan.getEntry());
		ReversePostOrderTraversal<VPBlockBase *> RPOT(TopRegion->getEntry());
		for (VPBlockBase *Base : RPOT) {
		VPBasicBlock *VPBB = Base->getEntryBasicBlock();
		for (auto I = VPBB->begin(), E = VPBB->end(); I != E; I++) {
		dcaballeUnsubmitted Done Reply Inline Actions `auto *` for casts and dyn_cast (585, 591, 592)? dcaballe: `auto *` for casts and dyn_cast (585, 591, 592)?
		assert(isa<VPInstruction>(&*I) && "Can only handle VPInstructions");
		auto VPInst = cast<VPInstruction>(&I);
		auto *Inst = cast<Instruction>(VPInst->getUnderlyingValue());
		auto *IG = IAI.getInterleaveGroup(Inst);
		if (!IG)
		continue;

		auto NewIGIter = Old2New.find(IG);
		rkruppeUnsubmitted Not Done Reply Inline Actions It doesn't seem like this memory is freed anywhere. Reading D49491 it seems to me that the InterleaveGroups allocated here are only needed while the `VPInterleavedAccessInfo` object is alive, so it could free them in its destructor (or even better, store `unique_ptr`s that take care of that automatically). rkruppe: It doesn't seem like this memory is freed anywhere. Reading D49491 it seems to me that the…
		fhahnAuthorUnsubmitted Not Done Reply Inline Actions Yep thanks! They should be freed in VPInterleavedAccessInfo's destructor. fhahn: Yep thanks! They should be freed in VPInterleavedAccessInfo's destructor.
		if (NewIGIter == Old2New.end())
		Old2New[IG] = new InterleaveGroup<VPInstruction>(
		IG->getFactor(), IG->isReverse(), IG->getAlignment());

		if (Inst == IG->getInsertPos())
		Old2New[IG]->setInsertPos(VPInst);

		InterleaveGroupMap[VPInst] = Old2New[IG];
		InterleaveGroupMap[VPInst]->insertMember(
		VPInst, IG->getIndex(Inst),
		IG->isReverse() ? (-1) * int(IG->getFactor()) : IG->getFactor());
		}
		}
		}

lib/Transforms/Vectorize/VPlanValue.h

	Show All 34 Lines
	// This is the base class of the VPlan Def/Use graph, used for modeling the data			// This is the base class of the VPlan Def/Use graph, used for modeling the data
	// flow into, within and out of the VPlan. VPValues can stand for live-ins			// flow into, within and out of the VPlan. VPValues can stand for live-ins
	// coming from the input IR, instructions which VPlan will generate if executed			// coming from the input IR, instructions which VPlan will generate if executed
	// and live-outs which the VPlan will need to fix accordingly.			// and live-outs which the VPlan will need to fix accordingly.
	class VPValue {			class VPValue {
	friend class VPBuilder;			friend class VPBuilder;
	friend class VPlanHCFGTransforms;			friend class VPlanHCFGTransforms;
	friend class VPBasicBlock;			friend class VPBasicBlock;
				friend class VPInterleavedAccessInfo;

	private:			private:
	const unsigned char SubclassID; ///< Subclass identifier (for isa/dyn_cast).			const unsigned char SubclassID; ///< Subclass identifier (for isa/dyn_cast).

	SmallVector<VPUser *, 1> Users;			SmallVector<VPUser *, 1> Users;

	protected:			protected:
	// Hold the underlying Value, if any, attached to this VPValue.			// Hold the underlying Value, if any, attached to this VPValue.
	▲ Show 20 Lines • Show All 120 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[VPlan] VPlan version of InterleavedAccessInfo.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 173825

include/llvm/Analysis/VectorUtils.h

lib/Analysis/VectorUtils.cpp

lib/Transforms/Vectorize/LoopVectorize.cpp

lib/Transforms/Vectorize/VPlan.h

lib/Transforms/Vectorize/VPlan.cpp

lib/Transforms/Vectorize/VPlanValue.h

This is an archive of the discontinued LLVM Phabricator instance.

[VPlan] VPlan version of InterleavedAccessInfo.ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 173825

include/llvm/Analysis/VectorUtils.h

lib/Analysis/VectorUtils.cpp

lib/Transforms/Vectorize/LoopVectorize.cpp

lib/Transforms/Vectorize/VPlan.h

lib/Transforms/Vectorize/VPlan.cpp

lib/Transforms/Vectorize/VPlanValue.h

[VPlan] VPlan version of InterleavedAccessInfo.
ClosedPublic