Diff 436028

llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp

Show First 20 Lines • Show All 317 Lines • ▼ Show 20 Lines	RISCVTTIImpl::getMinMaxReductionCost(VectorType Ty, VectorType CondTy,

if (!ST->useRVVForFixedLengthVectors())		if (!ST->useRVVForFixedLengthVectors())
return BaseT::getMinMaxReductionCost(Ty, CondTy, IsUnsigned, CostKind);		return BaseT::getMinMaxReductionCost(Ty, CondTy, IsUnsigned, CostKind);

// Skip if scalar size of Ty is bigger than ELEN.		// Skip if scalar size of Ty is bigger than ELEN.
if (Ty->getScalarSizeInBits() > ST->getELEN())		if (Ty->getScalarSizeInBits() > ST->getELEN())
return BaseT::getMinMaxReductionCost(Ty, CondTy, IsUnsigned, CostKind);		return BaseT::getMinMaxReductionCost(Ty, CondTy, IsUnsigned, CostKind);

		std::pair<InstructionCost, MVT> LT = TLI->getTypeLegalizationCost(DL, Ty);
		if (Ty->getElementType()->isIntegerTy(1))
		craig.topperUnsubmitted Not Done Reply Inline Actions I really hope that max/min of i1 don't occur in normal scenarios. craig.topper: I really hope that max/min of i1 don't occur in normal scenarios.
		// vcpop sequences, see vreduction-mask.ll. umax, smin actually only
		// cost 2, but we don't have enough info here so we slightly over cost.
		frasercrmckUnsubmitted Not Done Reply Inline Actions One thing I've noticed is that we do use increasingly more `vmnand` as the vectors become larger and have to be split. Should we be taking this into account? See e.g. an `and` reduce with -riscv-v-vector-bits-min=128: <256 x i1>: vmnot.m v8, v0 vcpop.m a0, v8 <512 x i1>: vmand.mm v8, v8, v10 vmand.mm v9, v0, v9 vmnand.mm v8, v9, v8 vcpop.m a0, v8 <1024 x i1>: vmand.mm v10, v10, v14 vmand.mm v8, v8, v12 vmand.mm v8, v8, v10 vmand.mm v9, v9, v13 vmand.mm v10, v0, v11 vmand.mm v9, v10, v9 vmnand.mm v8, v9, v8 vcpop.m a0, v8 frasercrmck: One thing I've noticed is that we do use increasingly more `vmnand` as the vectors become…
		reamesAuthorUnsubmitted Done Reply Inline Actions Good catch, thanks! reames: Good catch, thanks!
		return (LT.first - 1) + 3;

// IR Reduction is composed by two vmv and one rvv reduction instruction.		// IR Reduction is composed by two vmv and one rvv reduction instruction.
InstructionCost BaseCost = 2;		InstructionCost BaseCost = 2;
unsigned VL = cast<FixedVectorType>(Ty)->getNumElements();		unsigned VL = cast<FixedVectorType>(Ty)->getNumElements();
std::pair<InstructionCost, MVT> LT = TLI->getTypeLegalizationCost(DL, Ty);
return (LT.first - 1) + BaseCost + Log2_32_Ceil(VL);		return (LT.first - 1) + BaseCost + Log2_32_Ceil(VL);
}		}

InstructionCost		InstructionCost
RISCVTTIImpl::getArithmeticReductionCost(unsigned Opcode, VectorType *VTy,		RISCVTTIImpl::getArithmeticReductionCost(unsigned Opcode, VectorType *VTy,
Optional<FastMathFlags> FMF,		Optional<FastMathFlags> FMF,
TTI::TargetCostKind CostKind) {		TTI::TargetCostKind CostKind) {
// FIXME: Only supporting fixed vectors for now.		// FIXME: Only supporting fixed vectors for now.
if (!isa<FixedVectorType>(VTy))		if (!isa<FixedVectorType>(VTy))
return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);		return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);

// FIXME: Do not support i1 and/or reduction now.
if (VTy->getElementType()->isIntegerTy(1))
return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);

if (!ST->useRVVForFixedLengthVectors())		if (!ST->useRVVForFixedLengthVectors())
return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);		return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);

// Skip if scalar size of VTy is bigger than ELEN.		// Skip if scalar size of VTy is bigger than ELEN.
if (VTy->getScalarSizeInBits() > ST->getELEN())		if (VTy->getScalarSizeInBits() > ST->getELEN())
return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);		return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);

int ISD = TLI->InstructionOpcodeToISD(Opcode);		int ISD = TLI->InstructionOpcodeToISD(Opcode);
assert(ISD && "Invalid opcode");		assert(ISD && "Invalid opcode");

if (ISD != ISD::ADD && ISD != ISD::OR && ISD != ISD::XOR && ISD != ISD::AND &&		if (ISD != ISD::ADD && ISD != ISD::OR && ISD != ISD::XOR && ISD != ISD::AND &&
ISD != ISD::FADD)		ISD != ISD::FADD)
return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);		return BaseT::getArithmeticReductionCost(Opcode, VTy, FMF, CostKind);

		std::pair<InstructionCost, MVT> LT = TLI->getTypeLegalizationCost(DL, VTy);
		if (VTy->getElementType()->isIntegerTy(1))
		// vcpop sequences, see vreduction-mask.ll
		return (LT.first - 1) + (ISD == ISD::AND ? 3 : 2);

// IR Reduction is composed by two vmv and one rvv reduction instruction.		// IR Reduction is composed by two vmv and one rvv reduction instruction.
InstructionCost BaseCost = 2;		InstructionCost BaseCost = 2;
unsigned VL = cast<FixedVectorType>(VTy)->getNumElements();		unsigned VL = cast<FixedVectorType>(VTy)->getNumElements();
std::pair<InstructionCost, MVT> LT = TLI->getTypeLegalizationCost(DL, VTy);

if (TTI::requiresOrderedReduction(FMF))		if (TTI::requiresOrderedReduction(FMF))
return (LT.first - 1) + BaseCost + VL;		return (LT.first - 1) + BaseCost + VL;
return (LT.first - 1) + BaseCost + Log2_32_Ceil(VL);		return (LT.first - 1) + BaseCost + Log2_32_Ceil(VL);
}		}

void RISCVTTIImpl::getUnrollingPreferences(Loop *L, ScalarEvolution &SE,		void RISCVTTIImpl::getUnrollingPreferences(Loop *L, ScalarEvolution &SE,
TTI::UnrollingPreferences &UP,		TTI::UnrollingPreferences &UP,
OptimizationRemarkEmitter *ORE) {		OptimizationRemarkEmitter *ORE) {
▲ Show 20 Lines • Show All 92 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-add.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_i1(i32 %arg) {			define i32 @reduce_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_i1'			; CHECK-LABEL: 'reduce_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.add.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.add.v1i1(<1 x i1> undef)
				Miss_GrapeUnsubmitted Not Done Reply Inline Actions why the costModel of v1i1 is not 5 but 2 Miss_Grape: why the costModel of v1i1 is not 5 but 2 {F24240693}
	; CHECK-NEXT: Cost Model: Found an estimated cost of 11 for instruction: %V2 = call i1 @llvm.vector.reduce.add.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V2 = call i1 @llvm.vector.reduce.add.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 41 for instruction: %V4 = call i1 @llvm.vector.reduce.add.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V4 = call i1 @llvm.vector.reduce.add.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 121 for instruction: %V8 = call i1 @llvm.vector.reduce.add.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V8 = call i1 @llvm.vector.reduce.add.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 321 for instruction: %V16 = call i1 @llvm.vector.reduce.add.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V16 = call i1 @llvm.vector.reduce.add.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 801 for instruction: %V32 = call i1 @llvm.vector.reduce.add.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V32 = call i1 @llvm.vector.reduce.add.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1921 for instruction: %V64 = call i1 @llvm.vector.reduce.add.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V64 = call i1 @llvm.vector.reduce.add.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4481 for instruction: %V128 = call i1 @llvm.vector.reduce.add.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V128 = call i1 @llvm.vector.reduce.add.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;			;
	%V1 = call i1 @llvm.vector.reduce.add.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.add.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.add.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.add.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.add.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.add.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.add.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.add.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.add.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.add.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.add.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.add.v32i1(<32 x i1> undef)
	▲ Show 20 Lines • Show All 137 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-and.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s --check-prefixes=CHECK,RISCV32			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s --check-prefixes=CHECK,RISCV64			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_i1(i32 %arg) {			define i32 @reduce_i1(i32 %arg) {
	; RISCV32-LABEL: 'reduce_i1'			; CHECK-LABEL: 'reduce_i1'
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.and.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V1 = call i1 @llvm.vector.reduce.and.v1i1(<1 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.and.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.and.v2i1(<2 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V4 = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V4 = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V8 = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V8 = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %V16 = call i1 @llvm.vector.reduce.and.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V16 = call i1 @llvm.vector.reduce.and.v16i1(<16 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %V32 = call i1 @llvm.vector.reduce.and.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V32 = call i1 @llvm.vector.reduce.and.v32i1(<32 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %V64 = call i1 @llvm.vector.reduce.and.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V64 = call i1 @llvm.vector.reduce.and.v64i1(<64 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 132 for instruction: %V128 = call i1 @llvm.vector.reduce.and.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V128 = call i1 @llvm.vector.reduce.and.v128i1(<128 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 264 for instruction: %V256 = call i1 @llvm.vector.reduce.and.v256i1(<256 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V256 = call i1 @llvm.vector.reduce.and.v256i1(<256 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 528 for instruction: %V512 = call i1 @llvm.vector.reduce.and.v512i1(<512 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V512 = call i1 @llvm.vector.reduce.and.v512i1(<512 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1056 for instruction: %V1024 = call i1 @llvm.vector.reduce.and.v1024i1(<1024 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V1024 = call i1 @llvm.vector.reduce.and.v1024i1(<1024 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;
	; RISCV64-LABEL: 'reduce_i1'
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.and.v1i1(<1 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.and.v2i1(<2 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V4 = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V8 = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %V16 = call i1 @llvm.vector.reduce.and.v16i1(<16 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %V32 = call i1 @llvm.vector.reduce.and.v32i1(<32 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %V64 = call i1 @llvm.vector.reduce.and.v64i1(<64 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 130 for instruction: %V128 = call i1 @llvm.vector.reduce.and.v128i1(<128 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 260 for instruction: %V256 = call i1 @llvm.vector.reduce.and.v256i1(<256 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 520 for instruction: %V512 = call i1 @llvm.vector.reduce.and.v512i1(<512 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1040 for instruction: %V1024 = call i1 @llvm.vector.reduce.and.v1024i1(<1024 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;			;
	%V1 = call i1 @llvm.vector.reduce.and.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.and.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.and.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.and.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.and.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.and.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.and.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.and.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.and.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.and.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.and.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.and.v64i1(<64 x i1> undef)
	▲ Show 20 Lines • Show All 142 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-max.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_umin_i1(i32 %arg) {			define i32 @reduce_umin_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i1'			; CHECK-LABEL: 'reduce_umin_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.umax.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V1 = call i1 @llvm.vector.reduce.umax.v1i1(<1 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.umax.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.umax.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i1 @llvm.vector.reduce.umax.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V4 = call i1 @llvm.vector.reduce.umax.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i1 @llvm.vector.reduce.umax.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V8 = call i1 @llvm.vector.reduce.umax.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i1 @llvm.vector.reduce.umax.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V16 = call i1 @llvm.vector.reduce.umax.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i1 @llvm.vector.reduce.umax.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V32 = call i1 @llvm.vector.reduce.umax.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i1 @llvm.vector.reduce.umax.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V64 = call i1 @llvm.vector.reduce.umax.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i1 @llvm.vector.reduce.umax.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V128 = call i1 @llvm.vector.reduce.umax.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i1 @llvm.vector.reduce.umax.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.umax.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.umax.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.umax.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.umax.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.umax.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.umax.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.umax.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.umax.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.umax.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.umax.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.umax.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.umax.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.umax.v64i1(<64 x i1> undef)
	%V128 = call i1 @llvm.vector.reduce.umax.v128i1(<128 x i1> undef)			%V128 = call i1 @llvm.vector.reduce.umax.v128i1(<128 x i1> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umax_i8(i32 %arg) {			define i32 @reduce_umax_i8(i32 %arg) {
	; CHECK-LABEL: 'reduce_umax_i8'			; CHECK-LABEL: 'reduce_umax_i8'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.umax.v1i8(<1 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.umax.v1i8(<1 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.umax.v2i8(<2 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.umax.v2i8(<2 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.umax.v4i8(<4 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.umax.v4i8(<4 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.umax.v8i8(<8 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.umax.v8i8(<8 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.umax.v16i8(<16 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.umax.v16i8(<16 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.umax.v32i8(<32 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.umax.v32i8(<32 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.umax.v64i8(<64 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.umax.v64i8(<64 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.umax.v128i8(<128 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.umax.v128i8(<128 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i8 @llvm.vector.reduce.umax.v1i8(<1 x i8> undef)			%V1 = call i8 @llvm.vector.reduce.umax.v1i8(<1 x i8> undef)
	%V2 = call i8 @llvm.vector.reduce.umax.v2i8(<2 x i8> undef)			%V2 = call i8 @llvm.vector.reduce.umax.v2i8(<2 x i8> undef)
	%V4 = call i8 @llvm.vector.reduce.umax.v4i8(<4 x i8> undef)			%V4 = call i8 @llvm.vector.reduce.umax.v4i8(<4 x i8> undef)
	%V8 = call i8 @llvm.vector.reduce.umax.v8i8(<8 x i8> undef)			%V8 = call i8 @llvm.vector.reduce.umax.v8i8(<8 x i8> undef)
	%V16 = call i8 @llvm.vector.reduce.umax.v16i8(<16 x i8> undef)			%V16 = call i8 @llvm.vector.reduce.umax.v16i8(<16 x i8> undef)
	%V32 = call i8 @llvm.vector.reduce.umax.v32i8(<32 x i8> undef)			%V32 = call i8 @llvm.vector.reduce.umax.v32i8(<32 x i8> undef)
	%V64 = call i8 @llvm.vector.reduce.umax.v64i8(<64 x i8> undef)			%V64 = call i8 @llvm.vector.reduce.umax.v64i8(<64 x i8> undef)
	%V128 = call i8 @llvm.vector.reduce.umax.v128i8(<128 x i8> undef)			%V128 = call i8 @llvm.vector.reduce.umax.v128i8(<128 x i8> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umax_i16(i32 %arg) {			define i32 @reduce_umax_i16(i32 %arg) {
	; CHECK-LABEL: 'reduce_umax_i16'			; CHECK-LABEL: 'reduce_umax_i16'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.umax.v1i16(<1 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.umax.v1i16(<1 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.umax.v2i16(<2 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.umax.v2i16(<2 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.umax.v4i16(<4 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.umax.v4i16(<4 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.umax.v8i16(<8 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.umax.v8i16(<8 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.umax.v16i16(<16 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.umax.v16i16(<16 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.umax.v32i16(<32 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.umax.v32i16(<32 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.umax.v64i16(<64 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.umax.v64i16(<64 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.umax.v128i16(<128 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.umax.v128i16(<128 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i16 @llvm.vector.reduce.umax.v1i16(<1 x i16> undef)			%V1 = call i16 @llvm.vector.reduce.umax.v1i16(<1 x i16> undef)
	%V2 = call i16 @llvm.vector.reduce.umax.v2i16(<2 x i16> undef)			%V2 = call i16 @llvm.vector.reduce.umax.v2i16(<2 x i16> undef)
	%V4 = call i16 @llvm.vector.reduce.umax.v4i16(<4 x i16> undef)			%V4 = call i16 @llvm.vector.reduce.umax.v4i16(<4 x i16> undef)
	%V8 = call i16 @llvm.vector.reduce.umax.v8i16(<8 x i16> undef)			%V8 = call i16 @llvm.vector.reduce.umax.v8i16(<8 x i16> undef)
	%V16 = call i16 @llvm.vector.reduce.umax.v16i16(<16 x i16> undef)			%V16 = call i16 @llvm.vector.reduce.umax.v16i16(<16 x i16> undef)
	%V32 = call i16 @llvm.vector.reduce.umax.v32i16(<32 x i16> undef)			%V32 = call i16 @llvm.vector.reduce.umax.v32i16(<32 x i16> undef)
	%V64 = call i16 @llvm.vector.reduce.umax.v64i16(<64 x i16> undef)			%V64 = call i16 @llvm.vector.reduce.umax.v64i16(<64 x i16> undef)
	%V128 = call i16 @llvm.vector.reduce.umax.v128i16(<128 x i16> undef)			%V128 = call i16 @llvm.vector.reduce.umax.v128i16(<128 x i16> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umax_i32(i32 %arg) {			define i32 @reduce_umax_i32(i32 %arg) {
	; CHECK-LABEL: 'reduce_umax_i32'			; CHECK-LABEL: 'reduce_umax_i32'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.umax.v1i32(<1 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.umax.v1i32(<1 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.umax.v2i32(<2 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.umax.v2i32(<2 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.umax.v4i32(<4 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.umax.v4i32(<4 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.umax.v8i32(<8 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.umax.v8i32(<8 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.umax.v16i32(<16 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.umax.v16i32(<16 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.umax.v32i32(<32 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.umax.v32i32(<32 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.umax.v64i32(<64 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.umax.v64i32(<64 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.umax.v128i32(<128 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.umax.v128i32(<128 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i32 @llvm.vector.reduce.umax.v1i32(<1 x i32> undef)			%V1 = call i32 @llvm.vector.reduce.umax.v1i32(<1 x i32> undef)
	%V2 = call i32 @llvm.vector.reduce.umax.v2i32(<2 x i32> undef)			%V2 = call i32 @llvm.vector.reduce.umax.v2i32(<2 x i32> undef)
	%V4 = call i32 @llvm.vector.reduce.umax.v4i32(<4 x i32> undef)			%V4 = call i32 @llvm.vector.reduce.umax.v4i32(<4 x i32> undef)
	%V8 = call i32 @llvm.vector.reduce.umax.v8i32(<8 x i32> undef)			%V8 = call i32 @llvm.vector.reduce.umax.v8i32(<8 x i32> undef)
	%V16 = call i32 @llvm.vector.reduce.umax.v16i32(<16 x i32> undef)			%V16 = call i32 @llvm.vector.reduce.umax.v16i32(<16 x i32> undef)
	%V32 = call i32 @llvm.vector.reduce.umax.v32i32(<32 x i32> undef)			%V32 = call i32 @llvm.vector.reduce.umax.v32i32(<32 x i32> undef)
	%V64 = call i32 @llvm.vector.reduce.umax.v64i32(<64 x i32> undef)			%V64 = call i32 @llvm.vector.reduce.umax.v64i32(<64 x i32> undef)
	%V128 = call i32 @llvm.vector.reduce.umax.v128i32(<128 x i32> undef)			%V128 = call i32 @llvm.vector.reduce.umax.v128i32(<128 x i32> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umax_i64(i32 %arg) {			define i32 @reduce_umax_i64(i32 %arg) {
	; CHECK-LABEL: 'reduce_umax_i64'			; CHECK-LABEL: 'reduce_umax_i64'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.umax.v1i64(<1 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.umax.v1i64(<1 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.umax.v2i64(<2 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.umax.v2i64(<2 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.umax.v4i64(<4 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.umax.v4i64(<4 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.umax.v8i64(<8 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.umax.v8i64(<8 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.umax.v16i64(<16 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.umax.v16i64(<16 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.umax.v32i64(<32 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.umax.v32i64(<32 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.umax.v64i64(<64 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.umax.v64i64(<64 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.umax.v128i64(<128 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.umax.v128i64(<128 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i64 @llvm.vector.reduce.umax.v1i64(<1 x i64> undef)			%V1 = call i64 @llvm.vector.reduce.umax.v1i64(<1 x i64> undef)
	%V2 = call i64 @llvm.vector.reduce.umax.v2i64(<2 x i64> undef)			%V2 = call i64 @llvm.vector.reduce.umax.v2i64(<2 x i64> undef)
	%V4 = call i64 @llvm.vector.reduce.umax.v4i64(<4 x i64> undef)			%V4 = call i64 @llvm.vector.reduce.umax.v4i64(<4 x i64> undef)
	%V8 = call i64 @llvm.vector.reduce.umax.v8i64(<8 x i64> undef)			%V8 = call i64 @llvm.vector.reduce.umax.v8i64(<8 x i64> undef)
	%V16 = call i64 @llvm.vector.reduce.umax.v16i64(<16 x i64> undef)			%V16 = call i64 @llvm.vector.reduce.umax.v16i64(<16 x i64> undef)
	%V32 = call i64 @llvm.vector.reduce.umax.v32i64(<32 x i64> undef)			%V32 = call i64 @llvm.vector.reduce.umax.v32i64(<32 x i64> undef)
	%V64 = call i64 @llvm.vector.reduce.umax.v64i64(<64 x i64> undef)			%V64 = call i64 @llvm.vector.reduce.umax.v64i64(<64 x i64> undef)
	%V128 = call i64 @llvm.vector.reduce.umax.v128i64(<128 x i64> undef)			%V128 = call i64 @llvm.vector.reduce.umax.v128i64(<128 x i64> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i1(i32 %arg) {			define i32 @reduce_smin_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i1'			; CHECK-LABEL: 'reduce_smin_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.smax.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V1 = call i1 @llvm.vector.reduce.smax.v1i1(<1 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.smax.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.smax.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i1 @llvm.vector.reduce.smax.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V4 = call i1 @llvm.vector.reduce.smax.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i1 @llvm.vector.reduce.smax.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V8 = call i1 @llvm.vector.reduce.smax.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i1 @llvm.vector.reduce.smax.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V16 = call i1 @llvm.vector.reduce.smax.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i1 @llvm.vector.reduce.smax.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V32 = call i1 @llvm.vector.reduce.smax.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i1 @llvm.vector.reduce.smax.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V64 = call i1 @llvm.vector.reduce.smax.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i1 @llvm.vector.reduce.smax.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V128 = call i1 @llvm.vector.reduce.smax.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i1 @llvm.vector.reduce.smax.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.smax.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.smax.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.smax.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.smax.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.smax.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.smax.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.smax.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.smax.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.smax.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.smax.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.smax.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.smax.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.smax.v64i1(<64 x i1> undef)
	%V128 = call i1 @llvm.vector.reduce.smax.v128i1(<128 x i1> undef)			%V128 = call i1 @llvm.vector.reduce.smax.v128i1(<128 x i1> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smax_i8(i32 %arg) {			define i32 @reduce_smax_i8(i32 %arg) {
	; CHECK-LABEL: 'reduce_smax_i8'			; CHECK-LABEL: 'reduce_smax_i8'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.smax.v1i8(<1 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.smax.v1i8(<1 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.smax.v2i8(<2 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.smax.v2i8(<2 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.smax.v4i8(<4 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.smax.v4i8(<4 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.smax.v8i8(<8 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.smax.v8i8(<8 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.smax.v16i8(<16 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.smax.v16i8(<16 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.smax.v32i8(<32 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.smax.v32i8(<32 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.smax.v64i8(<64 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.smax.v64i8(<64 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.smax.v128i8(<128 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.smax.v128i8(<128 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i8 @llvm.vector.reduce.smax.v1i8(<1 x i8> undef)			%V1 = call i8 @llvm.vector.reduce.smax.v1i8(<1 x i8> undef)
	%V2 = call i8 @llvm.vector.reduce.smax.v2i8(<2 x i8> undef)			%V2 = call i8 @llvm.vector.reduce.smax.v2i8(<2 x i8> undef)
	%V4 = call i8 @llvm.vector.reduce.smax.v4i8(<4 x i8> undef)			%V4 = call i8 @llvm.vector.reduce.smax.v4i8(<4 x i8> undef)
	%V8 = call i8 @llvm.vector.reduce.smax.v8i8(<8 x i8> undef)			%V8 = call i8 @llvm.vector.reduce.smax.v8i8(<8 x i8> undef)
	%V16 = call i8 @llvm.vector.reduce.smax.v16i8(<16 x i8> undef)			%V16 = call i8 @llvm.vector.reduce.smax.v16i8(<16 x i8> undef)
	%V32 = call i8 @llvm.vector.reduce.smax.v32i8(<32 x i8> undef)			%V32 = call i8 @llvm.vector.reduce.smax.v32i8(<32 x i8> undef)
	%V64 = call i8 @llvm.vector.reduce.smax.v64i8(<64 x i8> undef)			%V64 = call i8 @llvm.vector.reduce.smax.v64i8(<64 x i8> undef)
	%V128 = call i8 @llvm.vector.reduce.smax.v128i8(<128 x i8> undef)			%V128 = call i8 @llvm.vector.reduce.smax.v128i8(<128 x i8> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smax_i16(i32 %arg) {			define i32 @reduce_smax_i16(i32 %arg) {
	; CHECK-LABEL: 'reduce_smax_i16'			; CHECK-LABEL: 'reduce_smax_i16'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.smax.v1i16(<1 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.smax.v1i16(<1 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.smax.v2i16(<2 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.smax.v2i16(<2 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.smax.v4i16(<4 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.smax.v4i16(<4 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.smax.v8i16(<8 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.smax.v8i16(<8 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.smax.v16i16(<16 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.smax.v16i16(<16 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.smax.v32i16(<32 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.smax.v32i16(<32 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.smax.v64i16(<64 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.smax.v64i16(<64 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.smax.v128i16(<128 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.smax.v128i16(<128 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i16 @llvm.vector.reduce.smax.v1i16(<1 x i16> undef)			%V1 = call i16 @llvm.vector.reduce.smax.v1i16(<1 x i16> undef)
	%V2 = call i16 @llvm.vector.reduce.smax.v2i16(<2 x i16> undef)			%V2 = call i16 @llvm.vector.reduce.smax.v2i16(<2 x i16> undef)
	%V4 = call i16 @llvm.vector.reduce.smax.v4i16(<4 x i16> undef)			%V4 = call i16 @llvm.vector.reduce.smax.v4i16(<4 x i16> undef)
				Miss_GrapeUnsubmitted Not Done Reply Inline Actions llvm.vector.reduce.smax.v2i16 and llvm.vector.reduce.smax.v4i16 have the same asemble, why llvm.vector.reduce.smax.v2i16: cost model 3 llvm.vector.reduce.smax.v4i16: cost model 4 Miss_Grape: llvm.vector.reduce.smax.v2i16 and llvm.vector.reduce.smax.v4i16 have the same asemble, why llvm.
	%V8 = call i16 @llvm.vector.reduce.smax.v8i16(<8 x i16> undef)			%V8 = call i16 @llvm.vector.reduce.smax.v8i16(<8 x i16> undef)
	%V16 = call i16 @llvm.vector.reduce.smax.v16i16(<16 x i16> undef)			%V16 = call i16 @llvm.vector.reduce.smax.v16i16(<16 x i16> undef)
	%V32 = call i16 @llvm.vector.reduce.smax.v32i16(<32 x i16> undef)			%V32 = call i16 @llvm.vector.reduce.smax.v32i16(<32 x i16> undef)
	%V64 = call i16 @llvm.vector.reduce.smax.v64i16(<64 x i16> undef)			%V64 = call i16 @llvm.vector.reduce.smax.v64i16(<64 x i16> undef)
	%V128 = call i16 @llvm.vector.reduce.smax.v128i16(<128 x i16> undef)			%V128 = call i16 @llvm.vector.reduce.smax.v128i16(<128 x i16> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smax_i32(i32 %arg) {			define i32 @reduce_smax_i32(i32 %arg) {
	; CHECK-LABEL: 'reduce_smax_i32'			; CHECK-LABEL: 'reduce_smax_i32'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.smax.v1i32(<1 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.smax.v1i32(<1 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.smax.v2i32(<2 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.smax.v2i32(<2 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.smax.v4i32(<4 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.smax.v4i32(<4 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.smax.v8i32(<8 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.smax.v8i32(<8 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.smax.v16i32(<16 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.smax.v16i32(<16 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.smax.v32i32(<32 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.smax.v32i32(<32 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.smax.v64i32(<64 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.smax.v64i32(<64 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.smax.v128i32(<128 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.smax.v128i32(<128 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i32 @llvm.vector.reduce.smax.v1i32(<1 x i32> undef)			%V1 = call i32 @llvm.vector.reduce.smax.v1i32(<1 x i32> undef)
	%V2 = call i32 @llvm.vector.reduce.smax.v2i32(<2 x i32> undef)			%V2 = call i32 @llvm.vector.reduce.smax.v2i32(<2 x i32> undef)
	%V4 = call i32 @llvm.vector.reduce.smax.v4i32(<4 x i32> undef)			%V4 = call i32 @llvm.vector.reduce.smax.v4i32(<4 x i32> undef)
	%V8 = call i32 @llvm.vector.reduce.smax.v8i32(<8 x i32> undef)			%V8 = call i32 @llvm.vector.reduce.smax.v8i32(<8 x i32> undef)
	%V16 = call i32 @llvm.vector.reduce.smax.v16i32(<16 x i32> undef)			%V16 = call i32 @llvm.vector.reduce.smax.v16i32(<16 x i32> undef)
	%V32 = call i32 @llvm.vector.reduce.smax.v32i32(<32 x i32> undef)			%V32 = call i32 @llvm.vector.reduce.smax.v32i32(<32 x i32> undef)
	%V64 = call i32 @llvm.vector.reduce.smax.v64i32(<64 x i32> undef)			%V64 = call i32 @llvm.vector.reduce.smax.v64i32(<64 x i32> undef)
	%V128 = call i32 @llvm.vector.reduce.smax.v128i32(<128 x i32> undef)			%V128 = call i32 @llvm.vector.reduce.smax.v128i32(<128 x i32> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smax_i64(i32 %arg) {			define i32 @reduce_smax_i64(i32 %arg) {
	; CHECK-LABEL: 'reduce_smax_i64'			; CHECK-LABEL: 'reduce_smax_i64'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.smax.v1i64(<1 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.smax.v1i64(<1 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.smax.v2i64(<2 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.smax.v2i64(<2 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.smax.v4i64(<4 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.smax.v4i64(<4 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.smax.v8i64(<8 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.smax.v8i64(<8 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.smax.v16i64(<16 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.smax.v16i64(<16 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.smax.v32i64(<32 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.smax.v32i64(<32 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.smax.v64i64(<64 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.smax.v64i64(<64 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.smax.v128i64(<128 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.smax.v128i64(<128 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i64 @llvm.vector.reduce.smax.v1i64(<1 x i64> undef)			%V1 = call i64 @llvm.vector.reduce.smax.v1i64(<1 x i64> undef)
	%V2 = call i64 @llvm.vector.reduce.smax.v2i64(<2 x i64> undef)			%V2 = call i64 @llvm.vector.reduce.smax.v2i64(<2 x i64> undef)
	%V4 = call i64 @llvm.vector.reduce.smax.v4i64(<4 x i64> undef)			%V4 = call i64 @llvm.vector.reduce.smax.v4i64(<4 x i64> undef)
	%V8 = call i64 @llvm.vector.reduce.smax.v8i64(<8 x i64> undef)			%V8 = call i64 @llvm.vector.reduce.smax.v8i64(<8 x i64> undef)
	%V16 = call i64 @llvm.vector.reduce.smax.v16i64(<16 x i64> undef)			%V16 = call i64 @llvm.vector.reduce.smax.v16i64(<16 x i64> undef)
	%V32 = call i64 @llvm.vector.reduce.smax.v32i64(<32 x i64> undef)			%V32 = call i64 @llvm.vector.reduce.smax.v32i64(<32 x i64> undef)
	%V64 = call i64 @llvm.vector.reduce.smax.v64i64(<64 x i64> undef)			%V64 = call i64 @llvm.vector.reduce.smax.v64i64(<64 x i64> undef)
	%V128 = call i64 @llvm.vector.reduce.smax.v128i64(<128 x i64> undef)			%V128 = call i64 @llvm.vector.reduce.smax.v128i64(<128 x i64> undef)
	▲ Show 20 Lines • Show All 84 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-min.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_umin_i1(i32 %arg) {			define i32 @reduce_umin_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i1'			; CHECK-LABEL: 'reduce_umin_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.umin.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V1 = call i1 @llvm.vector.reduce.umin.v1i1(<1 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.umin.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.umin.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i1 @llvm.vector.reduce.umin.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V4 = call i1 @llvm.vector.reduce.umin.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i1 @llvm.vector.reduce.umin.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V8 = call i1 @llvm.vector.reduce.umin.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i1 @llvm.vector.reduce.umin.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V16 = call i1 @llvm.vector.reduce.umin.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i1 @llvm.vector.reduce.umin.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V32 = call i1 @llvm.vector.reduce.umin.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i1 @llvm.vector.reduce.umin.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V64 = call i1 @llvm.vector.reduce.umin.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i1 @llvm.vector.reduce.umin.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V128 = call i1 @llvm.vector.reduce.umin.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i1 @llvm.vector.reduce.umin.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.umin.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.umin.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.umin.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.umin.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.umin.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.umin.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.umin.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.umin.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.umin.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.umin.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.umin.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.umin.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.umin.v64i1(<64 x i1> undef)
	%V128 = call i1 @llvm.vector.reduce.umin.v128i1(<128 x i1> undef)			%V128 = call i1 @llvm.vector.reduce.umin.v128i1(<128 x i1> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umin_i8(i32 %arg) {			define i32 @reduce_umin_i8(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i8'			; CHECK-LABEL: 'reduce_umin_i8'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.umin.v1i8(<1 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.umin.v1i8(<1 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.umin.v2i8(<2 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.umin.v2i8(<2 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.umin.v4i8(<4 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.umin.v4i8(<4 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.umin.v8i8(<8 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.umin.v8i8(<8 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.umin.v16i8(<16 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.umin.v16i8(<16 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.umin.v32i8(<32 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.umin.v32i8(<32 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.umin.v64i8(<64 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.umin.v64i8(<64 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.umin.v128i8(<128 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.umin.v128i8(<128 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i8 @llvm.vector.reduce.umin.v1i8(<1 x i8> undef)			%V1 = call i8 @llvm.vector.reduce.umin.v1i8(<1 x i8> undef)
	%V2 = call i8 @llvm.vector.reduce.umin.v2i8(<2 x i8> undef)			%V2 = call i8 @llvm.vector.reduce.umin.v2i8(<2 x i8> undef)
	%V4 = call i8 @llvm.vector.reduce.umin.v4i8(<4 x i8> undef)			%V4 = call i8 @llvm.vector.reduce.umin.v4i8(<4 x i8> undef)
	%V8 = call i8 @llvm.vector.reduce.umin.v8i8(<8 x i8> undef)			%V8 = call i8 @llvm.vector.reduce.umin.v8i8(<8 x i8> undef)
	%V16 = call i8 @llvm.vector.reduce.umin.v16i8(<16 x i8> undef)			%V16 = call i8 @llvm.vector.reduce.umin.v16i8(<16 x i8> undef)
	%V32 = call i8 @llvm.vector.reduce.umin.v32i8(<32 x i8> undef)			%V32 = call i8 @llvm.vector.reduce.umin.v32i8(<32 x i8> undef)
	%V64 = call i8 @llvm.vector.reduce.umin.v64i8(<64 x i8> undef)			%V64 = call i8 @llvm.vector.reduce.umin.v64i8(<64 x i8> undef)
	%V128 = call i8 @llvm.vector.reduce.umin.v128i8(<128 x i8> undef)			%V128 = call i8 @llvm.vector.reduce.umin.v128i8(<128 x i8> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umin_i16(i32 %arg) {			define i32 @reduce_umin_i16(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i16'			; CHECK-LABEL: 'reduce_umin_i16'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.umin.v1i16(<1 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.umin.v1i16(<1 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.umin.v2i16(<2 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.umin.v2i16(<2 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.umin.v4i16(<4 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.umin.v4i16(<4 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.umin.v8i16(<8 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.umin.v8i16(<8 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.umin.v16i16(<16 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.umin.v16i16(<16 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.umin.v32i16(<32 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.umin.v32i16(<32 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.umin.v64i16(<64 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.umin.v64i16(<64 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.umin.v128i16(<128 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.umin.v128i16(<128 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i16 @llvm.vector.reduce.umin.v1i16(<1 x i16> undef)			%V1 = call i16 @llvm.vector.reduce.umin.v1i16(<1 x i16> undef)
	%V2 = call i16 @llvm.vector.reduce.umin.v2i16(<2 x i16> undef)			%V2 = call i16 @llvm.vector.reduce.umin.v2i16(<2 x i16> undef)
	%V4 = call i16 @llvm.vector.reduce.umin.v4i16(<4 x i16> undef)			%V4 = call i16 @llvm.vector.reduce.umin.v4i16(<4 x i16> undef)
	%V8 = call i16 @llvm.vector.reduce.umin.v8i16(<8 x i16> undef)			%V8 = call i16 @llvm.vector.reduce.umin.v8i16(<8 x i16> undef)
	%V16 = call i16 @llvm.vector.reduce.umin.v16i16(<16 x i16> undef)			%V16 = call i16 @llvm.vector.reduce.umin.v16i16(<16 x i16> undef)
	%V32 = call i16 @llvm.vector.reduce.umin.v32i16(<32 x i16> undef)			%V32 = call i16 @llvm.vector.reduce.umin.v32i16(<32 x i16> undef)
	%V64 = call i16 @llvm.vector.reduce.umin.v64i16(<64 x i16> undef)			%V64 = call i16 @llvm.vector.reduce.umin.v64i16(<64 x i16> undef)
	%V128 = call i16 @llvm.vector.reduce.umin.v128i16(<128 x i16> undef)			%V128 = call i16 @llvm.vector.reduce.umin.v128i16(<128 x i16> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umin_i32(i32 %arg) {			define i32 @reduce_umin_i32(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i32'			; CHECK-LABEL: 'reduce_umin_i32'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.umin.v1i32(<1 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.umin.v1i32(<1 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.umin.v2i32(<2 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.umin.v2i32(<2 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.umin.v4i32(<4 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.umin.v4i32(<4 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.umin.v8i32(<8 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.umin.v8i32(<8 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.umin.v16i32(<16 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.umin.v16i32(<16 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.umin.v32i32(<32 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.umin.v32i32(<32 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.umin.v64i32(<64 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.umin.v64i32(<64 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.umin.v128i32(<128 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.umin.v128i32(<128 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i32 @llvm.vector.reduce.umin.v1i32(<1 x i32> undef)			%V1 = call i32 @llvm.vector.reduce.umin.v1i32(<1 x i32> undef)
	%V2 = call i32 @llvm.vector.reduce.umin.v2i32(<2 x i32> undef)			%V2 = call i32 @llvm.vector.reduce.umin.v2i32(<2 x i32> undef)
	%V4 = call i32 @llvm.vector.reduce.umin.v4i32(<4 x i32> undef)			%V4 = call i32 @llvm.vector.reduce.umin.v4i32(<4 x i32> undef)
	%V8 = call i32 @llvm.vector.reduce.umin.v8i32(<8 x i32> undef)			%V8 = call i32 @llvm.vector.reduce.umin.v8i32(<8 x i32> undef)
	%V16 = call i32 @llvm.vector.reduce.umin.v16i32(<16 x i32> undef)			%V16 = call i32 @llvm.vector.reduce.umin.v16i32(<16 x i32> undef)
	%V32 = call i32 @llvm.vector.reduce.umin.v32i32(<32 x i32> undef)			%V32 = call i32 @llvm.vector.reduce.umin.v32i32(<32 x i32> undef)
	%V64 = call i32 @llvm.vector.reduce.umin.v64i32(<64 x i32> undef)			%V64 = call i32 @llvm.vector.reduce.umin.v64i32(<64 x i32> undef)
	%V128 = call i32 @llvm.vector.reduce.umin.v128i32(<128 x i32> undef)			%V128 = call i32 @llvm.vector.reduce.umin.v128i32(<128 x i32> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_umin_i64(i32 %arg) {			define i32 @reduce_umin_i64(i32 %arg) {
	; CHECK-LABEL: 'reduce_umin_i64'			; CHECK-LABEL: 'reduce_umin_i64'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.umin.v1i64(<1 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.umin.v1i64(<1 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.umin.v2i64(<2 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.umin.v2i64(<2 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.umin.v4i64(<4 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.umin.v4i64(<4 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.umin.v8i64(<8 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.umin.v8i64(<8 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.umin.v16i64(<16 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.umin.v16i64(<16 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.umin.v32i64(<32 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.umin.v32i64(<32 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.umin.v64i64(<64 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.umin.v64i64(<64 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.umin.v128i64(<128 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.umin.v128i64(<128 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i64 @llvm.vector.reduce.umin.v1i64(<1 x i64> undef)			%V1 = call i64 @llvm.vector.reduce.umin.v1i64(<1 x i64> undef)
	%V2 = call i64 @llvm.vector.reduce.umin.v2i64(<2 x i64> undef)			%V2 = call i64 @llvm.vector.reduce.umin.v2i64(<2 x i64> undef)
	%V4 = call i64 @llvm.vector.reduce.umin.v4i64(<4 x i64> undef)			%V4 = call i64 @llvm.vector.reduce.umin.v4i64(<4 x i64> undef)
	%V8 = call i64 @llvm.vector.reduce.umin.v8i64(<8 x i64> undef)			%V8 = call i64 @llvm.vector.reduce.umin.v8i64(<8 x i64> undef)
	%V16 = call i64 @llvm.vector.reduce.umin.v16i64(<16 x i64> undef)			%V16 = call i64 @llvm.vector.reduce.umin.v16i64(<16 x i64> undef)
	%V32 = call i64 @llvm.vector.reduce.umin.v32i64(<32 x i64> undef)			%V32 = call i64 @llvm.vector.reduce.umin.v32i64(<32 x i64> undef)
	%V64 = call i64 @llvm.vector.reduce.umin.v64i64(<64 x i64> undef)			%V64 = call i64 @llvm.vector.reduce.umin.v64i64(<64 x i64> undef)
	%V128 = call i64 @llvm.vector.reduce.umin.v128i64(<128 x i64> undef)			%V128 = call i64 @llvm.vector.reduce.umin.v128i64(<128 x i64> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i1(i32 %arg) {			define i32 @reduce_smin_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i1'			; CHECK-LABEL: 'reduce_smin_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.smin.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V1 = call i1 @llvm.vector.reduce.smin.v1i1(<1 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.smin.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.smin.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i1 @llvm.vector.reduce.smin.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V4 = call i1 @llvm.vector.reduce.smin.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i1 @llvm.vector.reduce.smin.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V8 = call i1 @llvm.vector.reduce.smin.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i1 @llvm.vector.reduce.smin.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V16 = call i1 @llvm.vector.reduce.smin.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i1 @llvm.vector.reduce.smin.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V32 = call i1 @llvm.vector.reduce.smin.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i1 @llvm.vector.reduce.smin.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V64 = call i1 @llvm.vector.reduce.smin.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i1 @llvm.vector.reduce.smin.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V128 = call i1 @llvm.vector.reduce.smin.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i1 @llvm.vector.reduce.smin.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.smin.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.smin.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.smin.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.smin.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.smin.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.smin.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.smin.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.smin.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.smin.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.smin.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.smin.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.smin.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.smin.v64i1(<64 x i1> undef)
	%V128 = call i1 @llvm.vector.reduce.smin.v128i1(<128 x i1> undef)			%V128 = call i1 @llvm.vector.reduce.smin.v128i1(<128 x i1> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i8(i32 %arg) {			define i32 @reduce_smin_i8(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i8'			; CHECK-LABEL: 'reduce_smin_i8'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.smin.v1i8(<1 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i8 @llvm.vector.reduce.smin.v1i8(<1 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.smin.v2i8(<2 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i8 @llvm.vector.reduce.smin.v2i8(<2 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.smin.v4i8(<4 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i8 @llvm.vector.reduce.smin.v4i8(<4 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.smin.v8i8(<8 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i8 @llvm.vector.reduce.smin.v8i8(<8 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.smin.v16i8(<16 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i8 @llvm.vector.reduce.smin.v16i8(<16 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.smin.v32i8(<32 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i8 @llvm.vector.reduce.smin.v32i8(<32 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.smin.v64i8(<64 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i8 @llvm.vector.reduce.smin.v64i8(<64 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.smin.v128i8(<128 x i8> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i8 @llvm.vector.reduce.smin.v128i8(<128 x i8> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i8 @llvm.vector.reduce.smin.v1i8(<1 x i8> undef)			%V1 = call i8 @llvm.vector.reduce.smin.v1i8(<1 x i8> undef)
	%V2 = call i8 @llvm.vector.reduce.smin.v2i8(<2 x i8> undef)			%V2 = call i8 @llvm.vector.reduce.smin.v2i8(<2 x i8> undef)
	%V4 = call i8 @llvm.vector.reduce.smin.v4i8(<4 x i8> undef)			%V4 = call i8 @llvm.vector.reduce.smin.v4i8(<4 x i8> undef)
	%V8 = call i8 @llvm.vector.reduce.smin.v8i8(<8 x i8> undef)			%V8 = call i8 @llvm.vector.reduce.smin.v8i8(<8 x i8> undef)
	%V16 = call i8 @llvm.vector.reduce.smin.v16i8(<16 x i8> undef)			%V16 = call i8 @llvm.vector.reduce.smin.v16i8(<16 x i8> undef)
	%V32 = call i8 @llvm.vector.reduce.smin.v32i8(<32 x i8> undef)			%V32 = call i8 @llvm.vector.reduce.smin.v32i8(<32 x i8> undef)
	%V64 = call i8 @llvm.vector.reduce.smin.v64i8(<64 x i8> undef)			%V64 = call i8 @llvm.vector.reduce.smin.v64i8(<64 x i8> undef)
	%V128 = call i8 @llvm.vector.reduce.smin.v128i8(<128 x i8> undef)			%V128 = call i8 @llvm.vector.reduce.smin.v128i8(<128 x i8> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i16(i32 %arg) {			define i32 @reduce_smin_i16(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i16'			; CHECK-LABEL: 'reduce_smin_i16'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.smin.v1i16(<1 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i16 @llvm.vector.reduce.smin.v1i16(<1 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.smin.v2i16(<2 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i16 @llvm.vector.reduce.smin.v2i16(<2 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.smin.v4i16(<4 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i16 @llvm.vector.reduce.smin.v4i16(<4 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.smin.v8i16(<8 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i16 @llvm.vector.reduce.smin.v8i16(<8 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.smin.v16i16(<16 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i16 @llvm.vector.reduce.smin.v16i16(<16 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.smin.v32i16(<32 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i16 @llvm.vector.reduce.smin.v32i16(<32 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.smin.v64i16(<64 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i16 @llvm.vector.reduce.smin.v64i16(<64 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.smin.v128i16(<128 x i16> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V128 = call i16 @llvm.vector.reduce.smin.v128i16(<128 x i16> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i16 @llvm.vector.reduce.smin.v1i16(<1 x i16> undef)			%V1 = call i16 @llvm.vector.reduce.smin.v1i16(<1 x i16> undef)
	%V2 = call i16 @llvm.vector.reduce.smin.v2i16(<2 x i16> undef)			%V2 = call i16 @llvm.vector.reduce.smin.v2i16(<2 x i16> undef)
	%V4 = call i16 @llvm.vector.reduce.smin.v4i16(<4 x i16> undef)			%V4 = call i16 @llvm.vector.reduce.smin.v4i16(<4 x i16> undef)
	%V8 = call i16 @llvm.vector.reduce.smin.v8i16(<8 x i16> undef)			%V8 = call i16 @llvm.vector.reduce.smin.v8i16(<8 x i16> undef)
	%V16 = call i16 @llvm.vector.reduce.smin.v16i16(<16 x i16> undef)			%V16 = call i16 @llvm.vector.reduce.smin.v16i16(<16 x i16> undef)
	%V32 = call i16 @llvm.vector.reduce.smin.v32i16(<32 x i16> undef)			%V32 = call i16 @llvm.vector.reduce.smin.v32i16(<32 x i16> undef)
	%V64 = call i16 @llvm.vector.reduce.smin.v64i16(<64 x i16> undef)			%V64 = call i16 @llvm.vector.reduce.smin.v64i16(<64 x i16> undef)
	%V128 = call i16 @llvm.vector.reduce.smin.v128i16(<128 x i16> undef)			%V128 = call i16 @llvm.vector.reduce.smin.v128i16(<128 x i16> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i32(i32 %arg) {			define i32 @reduce_smin_i32(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i32'			; CHECK-LABEL: 'reduce_smin_i32'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.smin.v1i32(<1 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i32 @llvm.vector.reduce.smin.v1i32(<1 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.smin.v2i32(<2 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i32 @llvm.vector.reduce.smin.v2i32(<2 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.smin.v4i32(<4 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i32 @llvm.vector.reduce.smin.v4i32(<4 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.smin.v8i32(<8 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i32 @llvm.vector.reduce.smin.v8i32(<8 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.smin.v16i32(<16 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i32 @llvm.vector.reduce.smin.v16i32(<16 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.smin.v32i32(<32 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i32 @llvm.vector.reduce.smin.v32i32(<32 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.smin.v64i32(<64 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %V64 = call i32 @llvm.vector.reduce.smin.v64i32(<64 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.smin.v128i32(<128 x i32> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %V128 = call i32 @llvm.vector.reduce.smin.v128i32(<128 x i32> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i32 @llvm.vector.reduce.smin.v1i32(<1 x i32> undef)			%V1 = call i32 @llvm.vector.reduce.smin.v1i32(<1 x i32> undef)
	%V2 = call i32 @llvm.vector.reduce.smin.v2i32(<2 x i32> undef)			%V2 = call i32 @llvm.vector.reduce.smin.v2i32(<2 x i32> undef)
	%V4 = call i32 @llvm.vector.reduce.smin.v4i32(<4 x i32> undef)			%V4 = call i32 @llvm.vector.reduce.smin.v4i32(<4 x i32> undef)
	%V8 = call i32 @llvm.vector.reduce.smin.v8i32(<8 x i32> undef)			%V8 = call i32 @llvm.vector.reduce.smin.v8i32(<8 x i32> undef)
	%V16 = call i32 @llvm.vector.reduce.smin.v16i32(<16 x i32> undef)			%V16 = call i32 @llvm.vector.reduce.smin.v16i32(<16 x i32> undef)
	%V32 = call i32 @llvm.vector.reduce.smin.v32i32(<32 x i32> undef)			%V32 = call i32 @llvm.vector.reduce.smin.v32i32(<32 x i32> undef)
	%V64 = call i32 @llvm.vector.reduce.smin.v64i32(<64 x i32> undef)			%V64 = call i32 @llvm.vector.reduce.smin.v64i32(<64 x i32> undef)
	%V128 = call i32 @llvm.vector.reduce.smin.v128i32(<128 x i32> undef)			%V128 = call i32 @llvm.vector.reduce.smin.v128i32(<128 x i32> undef)
	ret i32 undef			ret i32 undef
	}			}

	define i32 @reduce_smin_i64(i32 %arg) {			define i32 @reduce_smin_i64(i32 %arg) {
	; CHECK-LABEL: 'reduce_smin_i64'			; CHECK-LABEL: 'reduce_smin_i64'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.smin.v1i64(<1 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i64 @llvm.vector.reduce.smin.v1i64(<1 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.smin.v2i64(<2 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i64 @llvm.vector.reduce.smin.v2i64(<2 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.smin.v4i64(<4 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %V4 = call i64 @llvm.vector.reduce.smin.v4i64(<4 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.smin.v8i64(<8 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V8 = call i64 @llvm.vector.reduce.smin.v8i64(<8 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.smin.v16i64(<16 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %V16 = call i64 @llvm.vector.reduce.smin.v16i64(<16 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.smin.v32i64(<32 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V32 = call i64 @llvm.vector.reduce.smin.v32i64(<32 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.smin.v64i64(<64 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V64 = call i64 @llvm.vector.reduce.smin.v64i64(<64 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.smin.v128i64(<128 x i64> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %V128 = call i64 @llvm.vector.reduce.smin.v128i64(<128 x i64> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
				;
	%V1 = call i64 @llvm.vector.reduce.smin.v1i64(<1 x i64> undef)			%V1 = call i64 @llvm.vector.reduce.smin.v1i64(<1 x i64> undef)
	%V2 = call i64 @llvm.vector.reduce.smin.v2i64(<2 x i64> undef)			%V2 = call i64 @llvm.vector.reduce.smin.v2i64(<2 x i64> undef)
	%V4 = call i64 @llvm.vector.reduce.smin.v4i64(<4 x i64> undef)			%V4 = call i64 @llvm.vector.reduce.smin.v4i64(<4 x i64> undef)
	%V8 = call i64 @llvm.vector.reduce.smin.v8i64(<8 x i64> undef)			%V8 = call i64 @llvm.vector.reduce.smin.v8i64(<8 x i64> undef)
	%V16 = call i64 @llvm.vector.reduce.smin.v16i64(<16 x i64> undef)			%V16 = call i64 @llvm.vector.reduce.smin.v16i64(<16 x i64> undef)
	%V32 = call i64 @llvm.vector.reduce.smin.v32i64(<32 x i64> undef)			%V32 = call i64 @llvm.vector.reduce.smin.v32i64(<32 x i64> undef)
	%V64 = call i64 @llvm.vector.reduce.smin.v64i64(<64 x i64> undef)			%V64 = call i64 @llvm.vector.reduce.smin.v64i64(<64 x i64> undef)
	%V128 = call i64 @llvm.vector.reduce.smin.v128i64(<128 x i64> undef)			%V128 = call i64 @llvm.vector.reduce.smin.v128i64(<128 x i64> undef)
	▲ Show 20 Lines • Show All 83 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-or.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s --check-prefixes=CHECK,RISCV32			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s --check-prefixes=CHECK,RISCV64			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_i1(i32 %arg) {			define i32 @reduce_i1(i32 %arg) {
	; RISCV32-LABEL: 'reduce_i1'			; CHECK-LABEL: 'reduce_i1'
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.or.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.or.v1i1(<1 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V2 = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V4 = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V4 = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V8 = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V8 = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %V16 = call i1 @llvm.vector.reduce.or.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V16 = call i1 @llvm.vector.reduce.or.v16i1(<16 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %V32 = call i1 @llvm.vector.reduce.or.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V32 = call i1 @llvm.vector.reduce.or.v32i1(<32 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 66 for instruction: %V64 = call i1 @llvm.vector.reduce.or.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V64 = call i1 @llvm.vector.reduce.or.v64i1(<64 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 132 for instruction: %V128 = call i1 @llvm.vector.reduce.or.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V128 = call i1 @llvm.vector.reduce.or.v128i1(<128 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 264 for instruction: %V256 = call i1 @llvm.vector.reduce.or.v256i1(<256 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V256 = call i1 @llvm.vector.reduce.or.v256i1(<256 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 528 for instruction: %V512 = call i1 @llvm.vector.reduce.or.v512i1(<512 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V512 = call i1 @llvm.vector.reduce.or.v512i1(<512 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1056 for instruction: %V1024 = call i1 @llvm.vector.reduce.or.v1024i1(<1024 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V1024 = call i1 @llvm.vector.reduce.or.v1024i1(<1024 x i1> undef)
	; RISCV32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;
	; RISCV64-LABEL: 'reduce_i1'
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.or.v1i1(<1 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %V2 = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 5 for instruction: %V4 = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %V8 = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 17 for instruction: %V16 = call i1 @llvm.vector.reduce.or.v16i1(<16 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 33 for instruction: %V32 = call i1 @llvm.vector.reduce.or.v32i1(<32 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 65 for instruction: %V64 = call i1 @llvm.vector.reduce.or.v64i1(<64 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 130 for instruction: %V128 = call i1 @llvm.vector.reduce.or.v128i1(<128 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 260 for instruction: %V256 = call i1 @llvm.vector.reduce.or.v256i1(<256 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 520 for instruction: %V512 = call i1 @llvm.vector.reduce.or.v512i1(<512 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1040 for instruction: %V1024 = call i1 @llvm.vector.reduce.or.v1024i1(<1024 x i1> undef)
	; RISCV64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;			;
	%V1 = call i1 @llvm.vector.reduce.or.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.or.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.or.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.or.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.or.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.or.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.or.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.or.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.or.v32i1(<32 x i1> undef)
	%V64 = call i1 @llvm.vector.reduce.or.v64i1(<64 x i1> undef)			%V64 = call i1 @llvm.vector.reduce.or.v64i1(<64 x i1> undef)
	▲ Show 20 Lines • Show All 142 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/RISCV/reduce-xor.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv32 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s
	; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s			; RUN: opt < %s -mtriple=riscv64 -mattr=+v -riscv-v-vector-bits-min=256 -passes='print<cost-model>' -cost-kind=throughput 2>&1 -disable-output \| FileCheck %s

	define i32 @reduce_i1(i32 %arg) {			define i32 @reduce_i1(i32 %arg) {
	; CHECK-LABEL: 'reduce_i1'			; CHECK-LABEL: 'reduce_i1'
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %V1 = call i1 @llvm.vector.reduce.xor.v1i1(<1 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V1 = call i1 @llvm.vector.reduce.xor.v1i1(<1 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 7 for instruction: %V2 = call i1 @llvm.vector.reduce.xor.v2i1(<2 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V2 = call i1 @llvm.vector.reduce.xor.v2i1(<2 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 21 for instruction: %V4 = call i1 @llvm.vector.reduce.xor.v4i1(<4 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V4 = call i1 @llvm.vector.reduce.xor.v4i1(<4 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 55 for instruction: %V8 = call i1 @llvm.vector.reduce.xor.v8i1(<8 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V8 = call i1 @llvm.vector.reduce.xor.v8i1(<8 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 137 for instruction: %V16 = call i1 @llvm.vector.reduce.xor.v16i1(<16 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V16 = call i1 @llvm.vector.reduce.xor.v16i1(<16 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 331 for instruction: %V32 = call i1 @llvm.vector.reduce.xor.v32i1(<32 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V32 = call i1 @llvm.vector.reduce.xor.v32i1(<32 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 781 for instruction: %V64 = call i1 @llvm.vector.reduce.xor.v64i1(<64 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V64 = call i1 @llvm.vector.reduce.xor.v64i1(<64 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1807 for instruction: %V128 = call i1 @llvm.vector.reduce.xor.v128i1(<128 x i1> undef)			; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %V128 = call i1 @llvm.vector.reduce.xor.v128i1(<128 x i1> undef)
	; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef			; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: ret i32 undef
	;			;
	%V1 = call i1 @llvm.vector.reduce.xor.v1i1(<1 x i1> undef)			%V1 = call i1 @llvm.vector.reduce.xor.v1i1(<1 x i1> undef)
	%V2 = call i1 @llvm.vector.reduce.xor.v2i1(<2 x i1> undef)			%V2 = call i1 @llvm.vector.reduce.xor.v2i1(<2 x i1> undef)
	%V4 = call i1 @llvm.vector.reduce.xor.v4i1(<4 x i1> undef)			%V4 = call i1 @llvm.vector.reduce.xor.v4i1(<4 x i1> undef)
	%V8 = call i1 @llvm.vector.reduce.xor.v8i1(<8 x i1> undef)			%V8 = call i1 @llvm.vector.reduce.xor.v8i1(<8 x i1> undef)
	%V16 = call i1 @llvm.vector.reduce.xor.v16i1(<16 x i1> undef)			%V16 = call i1 @llvm.vector.reduce.xor.v16i1(<16 x i1> undef)
	%V32 = call i1 @llvm.vector.reduce.xor.v32i1(<32 x i1> undef)			%V32 = call i1 @llvm.vector.reduce.xor.v32i1(<32 x i1> undef)
	▲ Show 20 Lines • Show All 137 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[RISCV] Refine costs for i1 reductions
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 436028

llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp

llvm/test/Analysis/CostModel/RISCV/reduce-add.ll

llvm/test/Analysis/CostModel/RISCV/reduce-and.ll

llvm/test/Analysis/CostModel/RISCV/reduce-max.ll

llvm/test/Analysis/CostModel/RISCV/reduce-min.ll

llvm/test/Analysis/CostModel/RISCV/reduce-or.ll

llvm/test/Analysis/CostModel/RISCV/reduce-xor.ll

This is an archive of the discontinued LLVM Phabricator instance.

[RISCV] Refine costs for i1 reductionsClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 436028

llvm/lib/Target/RISCV/RISCVTargetTransformInfo.cpp

llvm/test/Analysis/CostModel/RISCV/reduce-add.ll

llvm/test/Analysis/CostModel/RISCV/reduce-and.ll

llvm/test/Analysis/CostModel/RISCV/reduce-max.ll

llvm/test/Analysis/CostModel/RISCV/reduce-min.ll

llvm/test/Analysis/CostModel/RISCV/reduce-or.ll

llvm/test/Analysis/CostModel/RISCV/reduce-xor.ll

[RISCV] Refine costs for i1 reductions
ClosedPublic