Diff 372078

llvm/include/llvm/Analysis/IVDescriptors.h

Show First 20 Lines • Show All 111 Lines • ▼ Show 20 Lines	public:
};		};

/// Returns a struct describing if the instruction 'I' can be a recurrence		/// Returns a struct describing if the instruction 'I' can be a recurrence
/// variable of type 'Kind'. If the recurrence is a min/max pattern of		/// variable of type 'Kind'. If the recurrence is a min/max pattern of
/// select(icmp()) this function advances the instruction pointer 'I' from the		/// select(icmp()) this function advances the instruction pointer 'I' from the
/// compare instruction to the select instruction and stores this pointer in		/// compare instruction to the select instruction and stores this pointer in
/// 'PatternLastInst' member of the returned struct.		/// 'PatternLastInst' member of the returned struct.
static InstDesc isRecurrenceInstr(Instruction *I, RecurKind Kind,		static InstDesc isRecurrenceInstr(Instruction *I, RecurKind Kind,
InstDesc &Prev, FastMathFlags FMF);		InstDesc &Prev, FastMathFlags FuncFMF);

/// Returns true if instruction I has multiple uses in Insts		/// Returns true if instruction I has multiple uses in Insts
static bool hasMultipleUsesOf(Instruction *I,		static bool hasMultipleUsesOf(Instruction *I,
SmallPtrSetImpl<Instruction *> &Insts,		SmallPtrSetImpl<Instruction *> &Insts,
unsigned MaxNumUses);		unsigned MaxNumUses);

/// Returns true if all uses of the instruction I is within the Set.		/// Returns true if all uses of the instruction I is within the Set.
static bool areAllUsesIn(Instruction *I, SmallPtrSetImpl<Instruction *> &Set);		static bool areAllUsesIn(Instruction *I, SmallPtrSetImpl<Instruction *> &Set);

/// Returns a struct describing if the instruction is a		/// Returns a struct describing if the instruction is a llvm.(s/u)(min/max),
/// Select(ICmp(X, Y), X, Y) instruction pattern corresponding to a min(X, Y)		/// llvm.minnum/maxnum or a Select(ICmp(X, Y), X, Y) pair of instructions
/// or max(X, Y). \p Prev specifies the description of an already processed		/// corresponding to a min(X, Y) or max(X, Y), matching the recurrence kind \p
/// select instruction, so its corresponding cmp can be matched to it.		/// Kind. \p Prev specifies the description of an already processed select
static InstDesc isMinMaxSelectCmpPattern(Instruction *I,		/// instruction, so its corresponding cmp can be matched to it.
		static InstDesc isMinMaxSelectCmpPattern(Instruction *I, RecurKind Kind,
		spatelUnsubmitted Not Done Reply Inline Actions Should this be called "isMinMaxPattern" now since it matches both intrinsics and select-cmp? spatel: Should this be called "isMinMaxPattern" now since it matches both intrinsics and select-cmp?
const InstDesc &Prev);		const InstDesc &Prev);

/// Returns a struct describing if the instruction is a		/// Returns a struct describing if the instruction is a
/// Select(FCmp(X, Y), (Z = X op PHINode), PHINode) instruction pattern.		/// Select(FCmp(X, Y), (Z = X op PHINode), PHINode) instruction pattern.
static InstDesc isConditionalRdxPattern(RecurKind Kind, Instruction *I);		static InstDesc isConditionalRdxPattern(RecurKind Kind, Instruction *I);

/// Returns identity corresponding to the RecurrenceKind.		/// Returns identity corresponding to the RecurrenceKind.
static Constant *getRecurrenceIdentity(RecurKind K, Type *Tp,		static Constant *getRecurrenceIdentity(RecurKind K, Type *Tp,
FastMathFlags FMF);		FastMathFlags FMF);

/// Returns the opcode corresponding to the RecurrenceKind.		/// Returns the opcode corresponding to the RecurrenceKind.
static unsigned getOpcode(RecurKind Kind);		static unsigned getOpcode(RecurKind Kind);

/// Returns true if Phi is a reduction of type Kind and adds it to the		/// Returns true if Phi is a reduction of type Kind and adds it to the
/// RecurrenceDescriptor. If either \p DB is non-null or \p AC and \p DT are		/// RecurrenceDescriptor. If either \p DB is non-null or \p AC and \p DT are
/// non-null, the minimal bit width needed to compute the reduction will be		/// non-null, the minimal bit width needed to compute the reduction will be
/// computed.		/// computed.
static bool AddReductionVar(PHINode *Phi, RecurKind Kind, Loop *TheLoop,		static bool AddReductionVar(PHINode *Phi, RecurKind Kind, Loop *TheLoop,
FastMathFlags FMF,		FastMathFlags FuncFMF,
RecurrenceDescriptor &RedDes,		RecurrenceDescriptor &RedDes,
DemandedBits *DB = nullptr,		DemandedBits *DB = nullptr,
AssumptionCache *AC = nullptr,		AssumptionCache *AC = nullptr,
DominatorTree *DT = nullptr);		DominatorTree *DT = nullptr);

/// Returns true if Phi is a reduction in TheLoop. The RecurrenceDescriptor		/// Returns true if Phi is a reduction in TheLoop. The RecurrenceDescriptor
/// is returned in RedDes. If either \p DB is non-null or \p AC and \p DT are		/// is returned in RedDes. If either \p DB is non-null or \p AC and \p DT are
/// non-null, the minimal bit width needed to compute the reduction will be		/// non-null, the minimal bit width needed to compute the reduction will be
▲ Show 20 Lines • Show All 208 Lines • Show Last 20 Lines

llvm/lib/Analysis/IVDescriptors.cpp

Show First 20 Lines • Show All 417 Lines • ▼ Show 20 Lines	for (User *U : Cur->users()) {
if (isa<PHINode>(UI))		if (isa<PHINode>(UI))
PHIs.push_back(UI);		PHIs.push_back(UI);
else		else
NonPHIs.push_back(UI);		NonPHIs.push_back(UI);
} else if (!isa<PHINode>(UI) &&		} else if (!isa<PHINode>(UI) &&
((!isa<FCmpInst>(UI) && !isa<ICmpInst>(UI) &&		((!isa<FCmpInst>(UI) && !isa<ICmpInst>(UI) &&
!isa<SelectInst>(UI)) ||		!isa<SelectInst>(UI)) ||
(!isConditionalRdxPattern(Kind, UI).isRecurrence() &&		(!isConditionalRdxPattern(Kind, UI).isRecurrence() &&
!isMinMaxSelectCmpPattern(UI, IgnoredVal).isRecurrence())))		!isMinMaxSelectCmpPattern(UI, Kind, IgnoredVal)
		.isRecurrence())))
return false;		return false;

// Remember that we completed the cycle.		// Remember that we completed the cycle.
if (UI == Phi)		if (UI == Phi)
FoundStartPHI = true;		FoundStartPHI = true;
}		}
Worklist.append(PHIs.begin(), PHIs.end());		Worklist.append(PHIs.begin(), PHIs.end());
Worklist.append(NonPHIs.begin(), NonPHIs.end());		Worklist.append(NonPHIs.begin(), NonPHIs.end());
}		}

// This means we have seen one but not the other instruction of the		// This means we have seen one but not the other instruction of the
// pattern or more than just a select and cmp.		// pattern or more than just a select and cmp. Zero implies that we saw a
if (isMinMaxRecurrenceKind(Kind) && NumCmpSelectPatternInst != 2)		// llvm.min/max intrinsic, which is always OK.
		if (isMinMaxRecurrenceKind(Kind) && NumCmpSelectPatternInst != 2 &&
		NumCmpSelectPatternInst != 0)
return false;		return false;

if (!FoundStartPHI || !FoundReduxOp || !ExitInstruction)		if (!FoundStartPHI || !FoundReduxOp || !ExitInstruction)
return false;		return false;

const bool IsOrdered = checkOrderedReduction(		const bool IsOrdered = checkOrderedReduction(
Kind, ReduxDesc.getExactFPMathInst(), ExitInstruction, Phi);		Kind, ReduxDesc.getExactFPMathInst(), ExitInstruction, Phi);

▲ Show 20 Lines • Show All 53 Lines • ▼ Show 20 Lines	RecurrenceDescriptor RD(RdxStart, ExitInstruction, Kind, FMF,
ReduxDesc.getExactFPMathInst(), RecurrenceType,		ReduxDesc.getExactFPMathInst(), RecurrenceType,
IsSigned, IsOrdered, CastInsts);		IsSigned, IsOrdered, CastInsts);
RedDes = RD;		RedDes = RD;

return true;		return true;
}		}

RecurrenceDescriptor::InstDesc		RecurrenceDescriptor::InstDesc
RecurrenceDescriptor::isMinMaxSelectCmpPattern(Instruction *I,		RecurrenceDescriptor::isMinMaxSelectCmpPattern(Instruction *I, RecurKind Kind,
const InstDesc &Prev) {		const InstDesc &Prev) {
assert((isa<CmpInst>(I) || isa<SelectInst>(I)) &&		assert((isa<CmpInst>(I) || isa<SelectInst>(I) || isa<CallInst>(I)) &&
"Expected a cmp or select instruction");		"Expected a cmp or select or call instruction");
		if (!isMinMaxRecurrenceKind(Kind))
		return InstDesc(false, I);

// We must handle the select(cmp()) as a single instruction. Advance to the		// We must handle the select(cmp()) as a single instruction. Advance to the
// select.		// select.
CmpInst::Predicate Pred;		CmpInst::Predicate Pred;
if (match(I, m_OneUse(m_Cmp(Pred, m_Value(), m_Value())))) {		if (match(I, m_OneUse(m_Cmp(Pred, m_Value(), m_Value())))) {
if (auto *Select = dyn_cast<SelectInst>(*I->user_begin()))		if (auto *Select = dyn_cast<SelectInst>(*I->user_begin()))
return InstDesc(Select, Prev.getRecKind());		return InstDesc(Select, Prev.getRecKind());
}		}

// Only match select with single use cmp condition.		// Only match select with single use cmp condition, or a min/max intrinsic.
if (!match(I, m_Select(m_OneUse(m_Cmp(Pred, m_Value(), m_Value())), m_Value(),		if (!isa<IntrinsicInst>(I) &&
		!match(I, m_Select(m_OneUse(m_Cmp(Pred, m_Value(), m_Value())), m_Value(),
m_Value())))		m_Value())))
return InstDesc(false, I);		return InstDesc(false, I);

// Look for a min/max pattern.		// Look for a min/max pattern.
if (match(I, m_UMin(m_Value(), m_Value())))		if (match(I, m_UMin(m_Value(), m_Value())))
return InstDesc(I, RecurKind::UMin);		return InstDesc(Kind == RecurKind::UMin, I);
if (match(I, m_UMax(m_Value(), m_Value())))		if (match(I, m_UMax(m_Value(), m_Value())))
return InstDesc(I, RecurKind::UMax);		return InstDesc(Kind == RecurKind::UMax, I);
if (match(I, m_SMax(m_Value(), m_Value())))		if (match(I, m_SMax(m_Value(), m_Value())))
return InstDesc(I, RecurKind::SMax);		return InstDesc(Kind == RecurKind::SMax, I);
if (match(I, m_SMin(m_Value(), m_Value())))		if (match(I, m_SMin(m_Value(), m_Value())))
return InstDesc(I, RecurKind::SMin);		return InstDesc(Kind == RecurKind::SMin, I);
if (match(I, m_OrdFMin(m_Value(), m_Value())))		if (match(I, m_OrdFMin(m_Value(), m_Value())))
return InstDesc(I, RecurKind::FMin);		return InstDesc(Kind == RecurKind::FMin, I);
if (match(I, m_OrdFMax(m_Value(), m_Value())))		if (match(I, m_OrdFMax(m_Value(), m_Value())))
return InstDesc(I, RecurKind::FMax);		return InstDesc(Kind == RecurKind::FMax, I);
if (match(I, m_UnordFMin(m_Value(), m_Value())))		if (match(I, m_UnordFMin(m_Value(), m_Value())))
return InstDesc(I, RecurKind::FMin);		return InstDesc(Kind == RecurKind::FMin, I);
if (match(I, m_UnordFMax(m_Value(), m_Value())))		if (match(I, m_UnordFMax(m_Value(), m_Value())))
return InstDesc(I, RecurKind::FMax);		return InstDesc(Kind == RecurKind::FMax, I);
		if (match(I, m_Intrinsic<Intrinsic::minnum>(m_Value(), m_Value())))
		return InstDesc(Kind == RecurKind::FMin, I);
		if (match(I, m_Intrinsic<Intrinsic::maxnum>(m_Value(), m_Value())))
		return InstDesc(Kind == RecurKind::FMax, I);

return InstDesc(false, I);		return InstDesc(false, I);
}		}

/// Returns true if the select instruction has users in the compare-and-add		/// Returns true if the select instruction has users in the compare-and-add
/// reduction pattern below. The select instruction argument is the last one		/// reduction pattern below. The select instruction argument is the last one
/// in the sequence.		/// in the sequence.
///		///
Show All 36 Lines	RecurrenceDescriptor::isConditionalRdxPattern(RecurKind Kind, Instruction *I) {
if (m_FMul(m_Value(Op1), m_Value(Op2)).match(I1) && (I1->isFast()))		if (m_FMul(m_Value(Op1), m_Value(Op2)).match(I1) && (I1->isFast()))
return InstDesc(Kind == RecurKind::FMul, SI);		return InstDesc(Kind == RecurKind::FMul, SI);

return InstDesc(false, I);		return InstDesc(false, I);
}		}

RecurrenceDescriptor::InstDesc		RecurrenceDescriptor::InstDesc
RecurrenceDescriptor::isRecurrenceInstr(Instruction *I, RecurKind Kind,		RecurrenceDescriptor::isRecurrenceInstr(Instruction *I, RecurKind Kind,
InstDesc &Prev, FastMathFlags FMF) {		InstDesc &Prev, FastMathFlags FuncFMF) {
		assert(Prev.getRecKind() == RecurKind::None || Prev.getRecKind() == Kind);
switch (I->getOpcode()) {		switch (I->getOpcode()) {
default:		default:
return InstDesc(false, I);		return InstDesc(false, I);
case Instruction::PHI:		case Instruction::PHI:
return InstDesc(I, Prev.getRecKind(), Prev.getExactFPMathInst());		return InstDesc(I, Prev.getRecKind(), Prev.getExactFPMathInst());
case Instruction::Sub:		case Instruction::Sub:
case Instruction::Add:		case Instruction::Add:
return InstDesc(Kind == RecurKind::Add, I);		return InstDesc(Kind == RecurKind::Add, I);
Show All 14 Lines	case Instruction::FAdd:
return InstDesc(Kind == RecurKind::FAdd, I,		return InstDesc(Kind == RecurKind::FAdd, I,
I->hasAllowReassoc() ? nullptr : I);		I->hasAllowReassoc() ? nullptr : I);
case Instruction::Select:		case Instruction::Select:
if (Kind == RecurKind::FAdd || Kind == RecurKind::FMul)		if (Kind == RecurKind::FAdd || Kind == RecurKind::FMul)
return isConditionalRdxPattern(Kind, I);		return isConditionalRdxPattern(Kind, I);
LLVM_FALLTHROUGH;		LLVM_FALLTHROUGH;
case Instruction::FCmp:		case Instruction::FCmp:
case Instruction::ICmp:		case Instruction::ICmp:
		case Instruction::Call:
if (isIntMinMaxRecurrenceKind(Kind) ||		if (isIntMinMaxRecurrenceKind(Kind) ||
(FMF.noNaNs() && FMF.noSignedZeros() && isFPMinMaxRecurrenceKind(Kind)))		(((FuncFMF.noNaNs() && FuncFMF.noSignedZeros()) ||
return isMinMaxSelectCmpPattern(I, Prev);		(isa<FPMathOperator>(I) && I->hasNoNaNs() &&
		I->hasNoSignedZeros())) &&
		isFPMinMaxRecurrenceKind(Kind)))
		return isMinMaxSelectCmpPattern(I, Kind, Prev);
return InstDesc(false, I);		return InstDesc(false, I);
}		}
}		}

bool RecurrenceDescriptor::hasMultipleUsesOf(		bool RecurrenceDescriptor::hasMultipleUsesOf(
Instruction *I, SmallPtrSetImpl<Instruction *> &Insts,		Instruction *I, SmallPtrSetImpl<Instruction *> &Insts,
unsigned MaxNumUses) {		unsigned MaxNumUses) {
unsigned NumUses = 0;		unsigned NumUses = 0;
▲ Show 20 Lines • Show All 654 Lines • Show Last 20 Lines

llvm/test/Transforms/LoopVectorize/minmax_reduction.ll

Show First 20 Lines • Show All 868 Lines • ▼ Show 20 Lines	for.body:
%max.red.0 = select i1 %cmp3, float %0, float %max.red.08		%max.red.0 = select i1 %cmp3, float %0, float %max.red.08
%indvars.iv.next = add i64 %indvars.iv, 1		%indvars.iv.next = add i64 %indvars.iv, 1
%exitcond = icmp eq i64 %indvars.iv.next, 1024		%exitcond = icmp eq i64 %indvars.iv.next, 1024
br i1 %exitcond, label %for.end, label %for.body		br i1 %exitcond, label %for.end, label %for.body

for.end:		for.end:
ret float %max.red.0		ret float %max.red.0
}		}

		; CHECK-LABEL: @smin_intrinsic(
		spatelUnsubmitted Not Done Reply Inline Actions Does this call (and also fmin above) have the expected FMF too? spatel: Does this call (and also fmin above) have the expected FMF too?
		; CHECK: call <2 x i32> @llvm.smin.v2i32
		define i32 @smin_intrinsic(i32* nocapture readonly %x) {
		entry:
		br label %for.body

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi i32 [ 100, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.012
		%0 = load i32, i32* %arrayidx, align 4
		%1 = tail call i32 @llvm.smin.i32(i32 %s.011, i32 %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %1
		}

		; CHECK-LABEL: @smax_intrinsic(
		; CHECK: call <2 x i32> @llvm.smax.v2i32
		define i32 @smax_intrinsic(i32* nocapture readonly %x) {
		entry:
		br label %for.body

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi i32 [ 100, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.012
		%0 = load i32, i32* %arrayidx, align 4
		%1 = tail call i32 @llvm.smax.i32(i32 %s.011, i32 %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %1
		}

		; CHECK-LABEL: @umin_intrinsic(
		; CHECK: call <2 x i32> @llvm.umin.v2i32
		define i32 @umin_intrinsic(i32* nocapture readonly %x) {
		entry:
		br label %for.body

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi i32 [ 100, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.012
		%0 = load i32, i32* %arrayidx, align 4
		%1 = tail call i32 @llvm.umin.i32(i32 %s.011, i32 %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %1
		}

		; CHECK-LABEL: @umax_intrinsic(
		; CHECK: call <2 x i32> @llvm.umax.v2i32
		define i32 @umax_intrinsic(i32* nocapture readonly %x) {
		entry:
		br label %for.body

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi i32 [ 100, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.012
		%0 = load i32, i32* %arrayidx, align 4
		%1 = tail call i32 @llvm.umax.i32(i32 %s.011, i32 %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %1
		}

		; CHECK-LABEL: @fmin_intrinsic(
		; CHECK: call fast <2 x float> @llvm.minnum.v2f32
		define float @fmin_intrinsic(float* nocapture readonly %x) {
		entry:
		br label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret float %1

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi float [ 0.000000e+00, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds float, float* %x, i32 %i.012
		%0 = load float, float* %arrayidx, align 4
		%1 = tail call fast float @llvm.minnum.f32(float %s.011, float %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
		}

		; CHECK-LABEL: @fmax_intrinsic(
		; CHECK: call fast <2 x float> @llvm.maxnum.v2f32
		define float @fmax_intrinsic(float* nocapture readonly %x) {
		entry:
		br label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret float %1

		for.body: ; preds = %entry, %for.body
		%i.012 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.011 = phi float [ 0.000000e+00, %entry ], [ %1, %for.body ]
		%arrayidx = getelementptr inbounds float, float* %x, i32 %i.012
		%0 = load float, float* %arrayidx, align 4
		%1 = tail call fast float @llvm.maxnum.f32(float %s.011, float %0)
		%inc = add nuw nsw i32 %i.012, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
		}

		; CHECK-LABEL: @sminmax(
		; Min and max intrinsics - don't vectorize
		; CHECK-NOT: <2 x i32>
		define i32 @sminmax(i32* nocapture readonly %x, i32* nocapture readonly %y) {
		entry:
		br label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %cond9

		for.body: ; preds = %entry, %for.body
		%i.025 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.024 = phi i32 [ 0, %entry ], [ %cond9, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.025
		%0 = load i32, i32* %arrayidx, align 4
		%s.0. = tail call i32 @llvm.smin.i32(i32 %s.024, i32 %0)
		%arrayidx3 = getelementptr inbounds i32, i32* %y, i32 %i.025
		%1 = load i32, i32* %arrayidx3, align 4
		%cond9 = tail call i32 @llvm.smax.i32(i32 %s.0., i32 %1)
		%inc = add nuw nsw i32 %i.025, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
		}

		; CHECK-LABEL: @sminmin(
		; CHECK: call <2 x i32> @llvm.smin.v2i32
		; CHECK: call <2 x i32> @llvm.smin.v2i32
		define i32 @sminmin(i32* nocapture readonly %x, i32* nocapture readonly %y) {
		entry:
		br label %for.body

		for.cond.cleanup: ; preds = %for.body
		ret i32 %cond9

		for.body: ; preds = %entry, %for.body
		%i.025 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
		%s.024 = phi i32 [ 0, %entry ], [ %cond9, %for.body ]
		%arrayidx = getelementptr inbounds i32, i32* %x, i32 %i.025
		%0 = load i32, i32* %arrayidx, align 4
		%s.0. = tail call i32 @llvm.smin.i32(i32 %s.024, i32 %0)
		%arrayidx3 = getelementptr inbounds i32, i32* %y, i32 %i.025
		%1 = load i32, i32* %arrayidx3, align 4
		%cond9 = tail call i32 @llvm.smin.i32(i32 %s.0., i32 %1)
		%inc = add nuw nsw i32 %i.025, 1
		%exitcond.not = icmp eq i32 %inc, 1024
		br i1 %exitcond.not, label %for.cond.cleanup, label %for.body
		}

; Make sure any check-not directives are not triggered by function declarations.		; Make sure any check-not directives are not triggered by function declarations.
		spatelUnsubmitted Not Done Reply Inline Actions Either this test or the previous one could be just "nnan nsz" rather than "fast" so we are testing the minimum FMF (assuming that works as expected). spatel: Either this test or the previous one could be just "nnan nsz" rather than "fast" so we are…
		spatelUnsubmitted Not Done Reply Inline Actions Sorry if I wasn't clear, but it would be better to have one of these tests have minimal FMF and one have extra FMF (ie, the original 'fast' was good) because that shows we are propagating all FMF as expected even if they are not required for the transform. Alternatively, we could add a 2nd test for maxnum with 'fast'. spatel: Sorry if I wasn't clear, but it would be better to have one of these tests have minimal FMF and…
; CHECK: declare		; CHECK: declare

		declare i32 @llvm.smin.i32(i32, i32)
		declare i32 @llvm.smax.i32(i32, i32)
		declare i32 @llvm.umin.i32(i32, i32)
		declare i32 @llvm.umax.i32(i32, i32)
		declare float @llvm.minnum.f32(float, float)
		declare float @llvm.maxnum.f32(float, float)

attributes #0 = { "no-nans-fp-math"="true" "no-signed-zeros-fp-math"="true" }		attributes #0 = { "no-nans-fp-math"="true" "no-signed-zeros-fp-math"="true" }
attributes #1 = { "no-nans-fp-math"="true" }		attributes #1 = { "no-nans-fp-math"="true" }

This is an archive of the discontinued LLVM Phabricator instance.

[LV] Recognize intrinsic min/max reductions
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 372078

llvm/include/llvm/Analysis/IVDescriptors.h

llvm/lib/Analysis/IVDescriptors.cpp

llvm/test/Transforms/LoopVectorize/minmax_reduction.ll

This is an archive of the discontinued LLVM Phabricator instance.

[LV] Recognize intrinsic min/max reductions
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 372078

llvm/include/llvm/Analysis/IVDescriptors.h

llvm/lib/Analysis/IVDescriptors.cpp

llvm/test/Transforms/LoopVectorize/minmax_reduction.ll

[LV] Recognize intrinsic min/max reductions
ClosedPublic