Diff 116005

include/llvm/Analysis/TargetTransformInfo.h

Show First 20 Lines • Show All 184 Lines • ▼ Show 20 Lines	public:
/// comments for a detailed explanation of the cost values.		/// comments for a detailed explanation of the cost values.
int getOperationCost(unsigned Opcode, Type Ty, Type OpTy = nullptr) const;		int getOperationCost(unsigned Opcode, Type Ty, Type OpTy = nullptr) const;

/// \brief Estimate the cost of a GEP operation when lowered.		/// \brief Estimate the cost of a GEP operation when lowered.
///		///
/// The contract for this function is the same as \c getOperationCost except		/// The contract for this function is the same as \c getOperationCost except
/// that it supports an interface that provides extra information specific to		/// that it supports an interface that provides extra information specific to
/// the GEP operation.		/// the GEP operation.
int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(const GEPOperator *GEP,
ArrayRef<const Value *> Operands) const;		ArrayRef<const Value *> Operands) const;

/// \brief Estimate the cost of a EXT operation when lowered.		/// \brief Estimate the cost of a EXT operation when lowered.
///		///
/// The contract for this function is the same as \c getOperationCost except		/// The contract for this function is the same as \c getOperationCost except
/// that it supports an interface that provides extra information specific to		/// that it supports an interface that provides extra information specific to
/// the EXT operation.		/// the EXT operation.
int getExtCost(const Instruction I, const Value Src) const;		int getExtCost(const Instruction I, const Value Src) const;
▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines	public:
/// table.		/// table.
unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI,		unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI,
unsigned &JTSize) const;		unsigned &JTSize) const;

/// \brief Estimate the cost of a given IR user when lowered.		/// \brief Estimate the cost of a given IR user when lowered.
///		///
/// This can estimate the cost of either a ConstantExpr or Instruction when		/// This can estimate the cost of either a ConstantExpr or Instruction when
/// lowered. It has two primary advantages over the \c getOperationCost and		/// lowered. It has two primary advantages over the \c getOperationCost and
/// \c getGEPCost above, and one significant disadvantage: it can only be		/// \c getGEPCost above, and one significant disadvantage: it can only be
		hfinkelUnsubmitted Done Reply Inline Actions This comment would need to be updated. hfinkel: This comment would need to be updated.
/// used when the IR construct has already been formed.		/// used when the IR construct has already been formed.
///		///
/// The advantages are that it can inspect the SSA use graph to reason more		/// The advantages are that it can inspect the SSA use graph to reason more
/// accurately about the cost. For example, all-constant-GEPs can often be		/// accurately about the cost. For example, all-constant-GEPs can often be
/// folded into a load or other instruction, but if they are used in some		/// folded into a load or other instruction, but if they are used in some
/// other context they may not be folded. This routine can distinguish such		/// other context they may not be folded. This routine can distinguish such
/// cases.		/// cases.
///		///
▲ Show 20 Lines • Show All 661 Lines • ▼ Show 20 Lines	private:
std::unique_ptr<Concept> TTIImpl;		std::unique_ptr<Concept> TTIImpl;
};		};

class TargetTransformInfo::Concept {		class TargetTransformInfo::Concept {
public:		public:
virtual ~Concept() = 0;		virtual ~Concept() = 0;
virtual const DataLayout &getDataLayout() const = 0;		virtual const DataLayout &getDataLayout() const = 0;
virtual int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) = 0;		virtual int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) = 0;
virtual int getGEPCost(Type PointeeType, const Value Ptr,		virtual int getGEPCost(const GEPOperator *GEP,
ArrayRef<const Value *> Operands) = 0;		ArrayRef<const Value *> Operands) = 0;
virtual int getExtCost(const Instruction I, const Value Src) = 0;		virtual int getExtCost(const Instruction I, const Value Src) = 0;
virtual int getCallCost(FunctionType *FTy, int NumArgs) = 0;		virtual int getCallCost(FunctionType *FTy, int NumArgs) = 0;
virtual int getCallCost(const Function *F, int NumArgs) = 0;		virtual int getCallCost(const Function *F, int NumArgs) = 0;
virtual int getCallCost(const Function *F,		virtual int getCallCost(const Function *F,
ArrayRef<const Value *> Arguments) = 0;		ArrayRef<const Value *> Arguments) = 0;
virtual unsigned getInliningThresholdMultiplier() = 0;		virtual unsigned getInliningThresholdMultiplier() = 0;
virtual int getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,		virtual int getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,
▲ Show 20 Lines • Show All 162 Lines • ▼ Show 20 Lines	public:

const DataLayout &getDataLayout() const override {		const DataLayout &getDataLayout() const override {
return Impl.getDataLayout();		return Impl.getDataLayout();
}		}

int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) override {		int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) override {
return Impl.getOperationCost(Opcode, Ty, OpTy);		return Impl.getOperationCost(Opcode, Ty, OpTy);
}		}
int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(const GEPOperator *GEP,
ArrayRef<const Value *> Operands) override {		ArrayRef<const Value *> Operands) override {
return Impl.getGEPCost(PointeeType, Ptr, Operands);		return Impl.getGEPCost(GEP, Operands);
}		}
int getExtCost(const Instruction I, const Value Src) override {		int getExtCost(const Instruction I, const Value Src) override {
return Impl.getExtCost(I, Src);		return Impl.getExtCost(I, Src);
}		}
int getCallCost(FunctionType *FTy, int NumArgs) override {		int getCallCost(FunctionType *FTy, int NumArgs) override {
return Impl.getCallCost(FTy, NumArgs);		return Impl.getCallCost(FTy, NumArgs);
}		}
int getCallCost(const Function *F, int NumArgs) override {		int getCallCost(const Function *F, int NumArgs) override {
▲ Show 20 Lines • Show All 442 Lines • Show Last 20 Lines

include/llvm/Analysis/TargetTransformInfoImpl.h

Show First 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	public:

unsigned getOperationCost(unsigned Opcode, Type Ty, Type OpTy) {		unsigned getOperationCost(unsigned Opcode, Type Ty, Type OpTy) {
switch (Opcode) {		switch (Opcode) {
default:		default:
// By default, just classify everything as 'basic'.		// By default, just classify everything as 'basic'.
return TTI::TCC_Basic;		return TTI::TCC_Basic;

case Instruction::GetElementPtr:		case Instruction::GetElementPtr:
llvm_unreachable("Use getGEPCost for GEP operations!");		llvm_unreachable("Use getGEPCost for GEP operations!");
		hfinkelUnsubmitted Not Done Reply Inline Actions This needs to be updated, or... At a high level, I'm not sure that we want to completely remove the version of the function that can be used without an existing instruction. Instead, we should add an overload, and then fall back to the existing code where relevant. hfinkel: This needs to be updated, or... At a high level, I'm not sure that we want to completely…
		junbumlAuthorUnsubmitted Not Done Reply Inline Actions I'm not perfectly clear about this. Do you think we should keep the existing getGEPCost as it is: int getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef<const Value *> Operands), and add the new one: int getGEPCost(const GEPOperator *GEP, ArrayRef<const Value *> Operands)? junbuml: I'm not perfectly clear about this. Do you think we should keep the existing getGEPCost as it…
		hfinkelUnsubmitted Done Reply Inline Actions Yes. Then implement this new function so that it calls the instruction-independent version to handle the non-user-based logic. hfinkel: Yes. Then implement this new function so that it calls the instruction-independent version to…

case Instruction::BitCast:		case Instruction::BitCast:
assert(OpTy && "Cast instructions must provide the operand type");		assert(OpTy && "Cast instructions must provide the operand type");
if (Ty == OpTy \|\| (Ty->isPointerTy() && OpTy->isPointerTy()))		if (Ty == OpTy \|\| (Ty->isPointerTy() && OpTy->isPointerTy()))
// Identity and pointer-to-pointer casts are free.		// Identity and pointer-to-pointer casts are free.
return TTI::TCC_Free;		return TTI::TCC_Free;

// Otherwise, the default basic cost is used.		// Otherwise, the default basic cost is used.
Show All 34 Lines	case Instruction::Trunc:
// shift-right of the same width).		// shift-right of the same width).
if (DL.isLegalInteger(DL.getTypeSizeInBits(Ty)))		if (DL.isLegalInteger(DL.getTypeSizeInBits(Ty)))
return TTI::TCC_Free;		return TTI::TCC_Free;

return TTI::TCC_Basic;		return TTI::TCC_Basic;
}		}
}		}

int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(const GEPOperator GEP, ArrayRef<const Value > Operands) {
ArrayRef<const Value *> Operands) {
// In the basic model, we just assume that all-constant GEPs will be folded		// In the basic model, we just assume that all-constant GEPs will be folded
// into their uses via addressing modes.		// into their uses via addressing modes.
for (unsigned Idx = 0, Size = Operands.size(); Idx != Size; ++Idx)		for (unsigned Idx = 0, Size = Operands.size(); Idx != Size; ++Idx)
if (!isa<Constant>(Operands[Idx]))		if (!isa<Constant>(Operands[Idx]))
return TTI::TCC_Basic;		return TTI::TCC_Basic;

return TTI::TCC_Free;		return TTI::TCC_Free;
}		}
▲ Show 20 Lines • Show All 542 Lines • ▼ Show 20 Lines	unsigned getCallCost(const Function F, ArrayRef<const Value > Arguments) {
// Simply delegate to generic handling of the call.		// Simply delegate to generic handling of the call.
// FIXME: We should use instsimplify or something else to catch calls which		// FIXME: We should use instsimplify or something else to catch calls which
// will constant fold with these arguments.		// will constant fold with these arguments.
return static_cast<T *>(this)->getCallCost(F, Arguments.size());		return static_cast<T *>(this)->getCallCost(F, Arguments.size());
}		}

using BaseT::getGEPCost;		using BaseT::getGEPCost;

int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(const GEPOperator GEP, ArrayRef<const Value > Operands) {
ArrayRef<const Value *> Operands) {		Type *PointeeType = GEP->getSourceElementType();
		const Value *Ptr = GEP->getPointerOperand();

const GlobalValue *BaseGV = nullptr;		const GlobalValue *BaseGV = nullptr;
if (Ptr != nullptr) {		if (Ptr != nullptr) {
// TODO: will remove this when pointers have an opaque type.		// TODO: will remove this when pointers have an opaque type.
assert(Ptr->getType()->getScalarType()->getPointerElementType() ==		assert(Ptr->getType()->getScalarType()->getPointerElementType() ==
PointeeType &&		PointeeType &&
"explicit pointee type doesn't match operand's pointee type");		"explicit pointee type doesn't match operand's pointee type");
BaseGV = dyn_cast<GlobalValue>(Ptr->stripPointerCasts());		BaseGV = dyn_cast<GlobalValue>(Ptr->stripPointerCasts());
}		}
Show All 36 Lines	for (auto I = Operands.begin(); I != Operands.end(); ++I, ++GTI) {
}		}
}		}

// Assumes the address space is 0 when Ptr is nullptr.		// Assumes the address space is 0 when Ptr is nullptr.
unsigned AS =		unsigned AS =
(Ptr == nullptr ? 0 : Ptr->getType()->getPointerAddressSpace());		(Ptr == nullptr ? 0 : Ptr->getType()->getPointerAddressSpace());
if (static_cast<T *>(this)->isLegalAddressingMode(		if (static_cast<T *>(this)->isLegalAddressingMode(
TargetType, const_cast<GlobalValue *>(BaseGV), BaseOffset,		TargetType, const_cast<GlobalValue *>(BaseGV), BaseOffset,
HasBaseReg, Scale, AS))		HasBaseReg, Scale, AS)) {
		// Should check if the GEP is actually used in load / store instructions.
		// For simplicity, we check only direct users of the GEP.
		//
		// FIXME: GEPs could also be folded away as a part of addressing mode in
		// load/store instructions togetehr with other instructions (e.g., sext or
		// other GEPs). Handling all such cases must be expensive to be performed
		// in this function, so we stay conservative for now.
		for (const User *U : GEP->users()) {
		const Operator *UOP = cast<Operator>(U);
		const Value *PointerOperand = nullptr;
		if (auto *LI = dyn_cast<LoadInst>(UOP))
		PointerOperand = LI->getPointerOperand();
		else if (auto *SI = dyn_cast<StoreInst>(UOP))
		PointerOperand = SI->getPointerOperand();

		if ((!PointerOperand \|\| PointerOperand != GEP) &&
		!GEP->hasAllZeroIndices())
		return TTI::TCC_Basic;
		}
return TTI::TCC_Free;		return TTI::TCC_Free;
		}
return TTI::TCC_Basic;		return TTI::TCC_Basic;
}		}

using BaseT::getIntrinsicCost;		using BaseT::getIntrinsicCost;

unsigned getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,		unsigned getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,
ArrayRef<const Value *> Arguments) {		ArrayRef<const Value *> Arguments) {
// Delegate to the generic intrinsic handling code. This mostly provides an		// Delegate to the generic intrinsic handling code. This mostly provides an
// opportunity for targets to (for example) special case the cost of		// opportunity for targets to (for example) special case the cost of
// certain intrinsics based on constants used as arguments.		// certain intrinsics based on constants used as arguments.
SmallVector<Type *, 8> ParamTys;		SmallVector<Type *, 8> ParamTys;
ParamTys.reserve(Arguments.size());		ParamTys.reserve(Arguments.size());
for (unsigned Idx = 0, Size = Arguments.size(); Idx != Size; ++Idx)		for (unsigned Idx = 0, Size = Arguments.size(); Idx != Size; ++Idx)
		hfinkelUnsubmitted Done Reply Inline Actions togetehr -> together hfinkel: togetehr -> together
ParamTys.push_back(Arguments[Idx]->getType());		ParamTys.push_back(Arguments[Idx]->getType());
return static_cast<T *>(this)->getIntrinsicCost(IID, RetTy, ParamTys);		return static_cast<T *>(this)->getIntrinsicCost(IID, RetTy, ParamTys);
		hfinkelUnsubmitted Not Done Reply Inline Actions I don't understand this comment. If there's a sext/zext, then it would be an operand of the GEP, not the other way around, no? hfinkel: I don't understand this comment. If there's a sext/zext, then it would be an operand of the GEP…
		junbumlAuthorUnsubmitted Not Done Reply Inline Actions Yes, sext must be an operand of the GEP, not a user. Sorry for the confusion. I will remove "sext" from the comment. junbuml: Yes, sext must be an operand of the GEP, not a user. Sorry for the confusion. I will remove "sext"…
}		}

unsigned getUserCost(const User U, ArrayRef<const Value > Operands) {		unsigned getUserCost(const User U, ArrayRef<const Value > Operands) {
if (isa<PHINode>(U))		if (isa<PHINode>(U))
return TTI::TCC_Free; // Model all PHI nodes as free.		return TTI::TCC_Free; // Model all PHI nodes as free.

if (const GEPOperator *GEP = dyn_cast<GEPOperator>(U)) {		if (const GEPOperator *GEP = dyn_cast<GEPOperator>(U))
return static_cast<T *>(this)->getGEPCost(GEP->getSourceElementType(),		return static_cast<T *>(this)->getGEPCost(GEP,
GEP->getPointerOperand(),
Operands.drop_front());		Operands.drop_front());
}

if (auto CS = ImmutableCallSite(U)) {		if (auto CS = ImmutableCallSite(U)) {
const Function *F = CS.getCalledFunction();		const Function *F = CS.getCalledFunction();
if (!F) {		if (!F) {
// Just use the called value type.		// Just use the called value type.
Type *FTy = CS.getCalledValue()->getType()->getPointerElementType();		Type *FTy = CS.getCalledValue()->getType()->getPointerElementType();
return static_cast<T *>(this)		return static_cast<T *>(this)
->getCallCost(cast<FunctionType>(FTy), CS.arg_size());		->getCallCost(cast<FunctionType>(FTy), CS.arg_size());
▲ Show 20 Lines • Show All 43 Lines • Show Last 20 Lines

include/llvm/CodeGen/BasicTTIImpl.h

Show First 20 Lines • Show All 140 Lines • ▼ Show 20 Lines	bool isProfitableToHoist(Instruction *I) {
return getTLI()->isProfitableToHoist(I);		return getTLI()->isProfitableToHoist(I);
}		}

bool isTypeLegal(Type *Ty) {		bool isTypeLegal(Type *Ty) {
EVT VT = getTLI()->getValueType(DL, Ty);		EVT VT = getTLI()->getValueType(DL, Ty);
return getTLI()->isTypeLegal(VT);		return getTLI()->isTypeLegal(VT);
}		}

int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(const GEPOperator *GEP,
ArrayRef<const Value *> Operands) {		ArrayRef<const Value *> Operands) {
return BaseT::getGEPCost(PointeeType, Ptr, Operands);		return BaseT::getGEPCost(GEP, Operands);
}		}

int getExtCost(const Instruction I, const Value Src) {		int getExtCost(const Instruction I, const Value Src) {
if (getTLI()->isExtFree(I))		if (getTLI()->isExtFree(I))
return TargetTransformInfo::TCC_Free;		return TargetTransformInfo::TCC_Free;

if (isa<ZExtInst>(I) \|\| isa<SExtInst>(I))		if (isa<ZExtInst>(I) \|\| isa<SExtInst>(I))
if (const LoadInst *LI = dyn_cast<LoadInst>(Src))		if (const LoadInst *LI = dyn_cast<LoadInst>(Src))
▲ Show 20 Lines • Show All 1,100 Lines • Show Last 20 Lines

lib/Analysis/TargetTransformInfo.cpp

Show First 20 Lines • Show All 77 Lines • ▼ Show 20 Lines	int TargetTransformInfo::getCallCost(const Function *F,
assert(Cost >= 0 && "TTI should not produce negative costs!");		assert(Cost >= 0 && "TTI should not produce negative costs!");
return Cost;		return Cost;
}		}

unsigned TargetTransformInfo::getInliningThresholdMultiplier() const {		unsigned TargetTransformInfo::getInliningThresholdMultiplier() const {
return TTIImpl->getInliningThresholdMultiplier();		return TTIImpl->getInliningThresholdMultiplier();
}		}

int TargetTransformInfo::getGEPCost(Type PointeeType, const Value Ptr,		int TargetTransformInfo::getGEPCost(const GEPOperator *GEP,
ArrayRef<const Value *> Operands) const {		ArrayRef<const Value *> Operands) const {
return TTIImpl->getGEPCost(PointeeType, Ptr, Operands);		return TTIImpl->getGEPCost(GEP, Operands);
}		}

int TargetTransformInfo::getExtCost(const Instruction *I,		int TargetTransformInfo::getExtCost(const Instruction *I,
const Value *Src) const {		const Value *Src) const {
return TTIImpl->getExtCost(I, Src);		return TTIImpl->getExtCost(I, Src);
}		}

int TargetTransformInfo::getIntrinsicCost(		int TargetTransformInfo::getIntrinsicCost(
▲ Show 20 Lines • Show All 1,099 Lines • Show Last 20 Lines

lib/Transforms/Scalar/NaryReassociate.cpp

Show First 20 Lines • Show All 258 Lines • ▼ Show 20 Lines	Instruction NaryReassociatePass::tryReassociate(Instruction I) {
}		}
}		}

static bool isGEPFoldable(GetElementPtrInst *GEP,		static bool isGEPFoldable(GetElementPtrInst *GEP,
const TargetTransformInfo *TTI) {		const TargetTransformInfo *TTI) {
SmallVector<const Value*, 4> Indices;		SmallVector<const Value*, 4> Indices;
for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)		for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)
Indices.push_back(*I);		Indices.push_back(*I);
return TTI->getGEPCost(GEP->getSourceElementType(), GEP->getPointerOperand(),		return TTI->getGEPCost(cast<GEPOperator>(GEP),
Indices) == TargetTransformInfo::TCC_Free;		Indices) == TargetTransformInfo::TCC_Free;
}		}

Instruction NaryReassociatePass::tryReassociateGEP(GetElementPtrInst GEP) {		Instruction NaryReassociatePass::tryReassociateGEP(GetElementPtrInst GEP) {
// Not worth reassociating GEP if it is foldable.		// Not worth reassociating GEP if it is foldable.
if (isGEPFoldable(GEP, TTI))		if (isGEPFoldable(GEP, TTI))
return nullptr;		return nullptr;

▲ Show 20 Lines • Show All 234 Lines • Show Last 20 Lines

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

Show First 20 Lines • Show All 233 Lines • ▼ Show 20 Lines	return (Basis.Ins != C.Ins && // skip the same instruction
Basis.CandidateKind == C.CandidateKind);		Basis.CandidateKind == C.CandidateKind);
}		}

static bool isGEPFoldable(GetElementPtrInst *GEP,		static bool isGEPFoldable(GetElementPtrInst *GEP,
const TargetTransformInfo *TTI) {		const TargetTransformInfo *TTI) {
SmallVector<const Value*, 4> Indices;		SmallVector<const Value*, 4> Indices;
for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)		for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)
Indices.push_back(*I);		Indices.push_back(*I);
return TTI->getGEPCost(GEP->getSourceElementType(), GEP->getPointerOperand(),		return TTI->getGEPCost(cast<GEPOperator>(GEP),
Indices) == TargetTransformInfo::TCC_Free;		Indices) == TargetTransformInfo::TCC_Free;
}		}

// Returns whether (Base + Index * Stride) can be folded to an addressing mode.		// Returns whether (Base + Index * Stride) can be folded to an addressing mode.
static bool isAddFoldable(const SCEV Base, ConstantInt Index, Value *Stride,		static bool isAddFoldable(const SCEV Base, ConstantInt Index, Value *Stride,
TargetTransformInfo *TTI) {		TargetTransformInfo *TTI) {
// Index->getSExtValue() may crash if Index is wider than 64-bit.		// Index->getSExtValue() may crash if Index is wider than 64-bit.
return Index->getBitWidth() <= 64 &&		return Index->getBitWidth() <= 64 &&
▲ Show 20 Lines • Show All 451 Lines • Show Last 20 Lines

test/Analysis/CostModel/AArch64/gep.ll

	Show First 20 Lines • Show All 284 Lines • ▼ Show 20 Lines

	define i64 @test36(i64* %p) {			define i64 @test36(i64* %p) {
	; CHECK-LABEL: test36			; CHECK-LABEL: test36
	; CHECK: cost of 1 for instruction: {{.}} getelementptr inbounds i64, i64			; CHECK: cost of 1 for instruction: {{.}} getelementptr inbounds i64, i64
	%a = getelementptr inbounds i64, i64* %p, i32 -512			%a = getelementptr inbounds i64, i64* %p, i32 -512
	%v = load i64, i64* %a			%v = load i64, i64* %a
	ret i64 %v			ret i64 %v
	}			}

				; CHECK-LABEL: test37
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test37(i64 %j, i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 %j
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL: test38
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test38(i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 10
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL:test39
				; CHECK: cost of 0 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test39(i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 0
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL:test40
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test40(i8 readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 10
				ret i8** %arrayidx0
				}

				; CHECK-LABEL:test41
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8
				define i8 @test41(i8* %V, i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %V, i64 10
				store i8* %arrayidx0, i8** %P
				ret i8 0
				}

				declare i8* @func(i8**)

test/Analysis/CostModel/X86/vector_gep.ll

	; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-linux-unknown-unknown -mattr=+avx512f \| FileCheck %s			; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-linux-unknown-unknown -mattr=+avx512f \| FileCheck %s

	%struct.S = type { [1000 x i32] }			%struct.S = type { [1000 x i32] }


	declare <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*>, i32, <4 x i1>, <4 x i32>)			declare <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*>, i32, <4 x i1>, <4 x i32>)

	define <4 x i32> @foov(<4 x %struct.S*> %s, i64 %base){			define <4 x i32> @foov(<4 x %struct.S*> %s, i64 %base){
	%temp = insertelement <4 x i64> undef, i64 %base, i32 0			%temp = insertelement <4 x i64> undef, i64 %base, i32 0
	%vector = shufflevector <4 x i64> %temp, <4 x i64> undef, <4 x i32> zeroinitializer			%vector = shufflevector <4 x i64> %temp, <4 x i64> undef, <4 x i32> zeroinitializer
	;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds %struct.S			;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds %struct.S
				junbumlAuthorUnsubmitted Not Done Reply Inline Actions With this patch, %B becomes non-free because it is used in %arrayidx (a non-memory operation). It might be possible to continue by checking the users of such non-memory users, but doing this exhaustively would be too expensive for getGEPCost. It might be possible to add some simple exceptions, but I didn't add such checks in this patch. junbuml: With this patch, %B becomes non-free because it is used in %arrayidx (a non-memory…
				efriedmaUnsubmitted Not Done Reply Inline Actions Yes, it should be fine to avoid folding together GEPs in getUserCost(). (Arguably, you might want to, but it could get complicated, so okay to skip that for now.) That said, there's something going wrong here. "gep %x, 0, 0" is free because it's just a type conversion. By the same reasoning, "gep %s, zeroinitializer, zeroinitializer" should also be free. efriedma: Yes, it should be fine to avoid folding together GEPs in getUserCost(). (Arguably, you might…
				junbumlAuthorUnsubmitted Not Done Reply Inline Actions We might be able to handle zeroinitializer in hasAllZeroIndices() for ArrayType. In that case, I think it should be a separate patch. junbuml: We might be able to handle zeroinitializer in hasAllZeroIndices() for ArrayType. In that case, I…
				hfinkelUnsubmitted Done Reply Inline Actions Why a separate patch? This patch is not overly complicated, and if there's a separate patch we'll have a regression in between. If you want to separate the patches, we should have them both before either is committed. But it sounds like a couple lines of code and a few lines of code for some tests. hfinkel: Why a separate patch? This patch is not overly complicated, and if there's a separate patch…
	%B = getelementptr inbounds %struct.S, <4 x %struct.S*> %s, <4 x i32> zeroinitializer, <4 x i32> zeroinitializer			%B = getelementptr inbounds %struct.S, <4 x %struct.S*> %s, <4 x i32> zeroinitializer, <4 x i32> zeroinitializer
	;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds [1000 x i32]			;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds [1000 x i32]
	%arrayidx = getelementptr inbounds [1000 x i32], <4 x [1000 x i32]*> %B, <4 x i64> zeroinitializer, <4 x i64> %vector			%arrayidx = getelementptr inbounds [1000 x i32], <4 x [1000 x i32]*> %B, <4 x i64> zeroinitializer, <4 x i64> %vector
	%res = call <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*> %arrayidx, i32 4, <4 x i1> <i1 true, i1 true, i1 true, i1 true>, <4 x i32> undef)			%res = call <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*> %arrayidx, i32 4, <4 x i1> <i1 true, i1 true, i1 true, i1 true>, <4 x i32> undef)
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}

This is an archive of the discontinued LLVM Phabricator instance.

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 116005

include/llvm/Analysis/TargetTransformInfo.h

include/llvm/Analysis/TargetTransformInfoImpl.h

include/llvm/CodeGen/BasicTTIImpl.h

lib/Analysis/TargetTransformInfo.cpp

lib/Transforms/Scalar/NaryReassociate.cpp

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

test/Analysis/CostModel/AArch64/gep.ll

test/Analysis/CostModel/X86/vector_gep.ll

This is an archive of the discontinued LLVM Phabricator instance.

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 116005

include/llvm/Analysis/TargetTransformInfo.h

include/llvm/Analysis/TargetTransformInfoImpl.h

include/llvm/CodeGen/BasicTTIImpl.h

lib/Analysis/TargetTransformInfo.cpp

lib/Transforms/Scalar/NaryReassociate.cpp

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

test/Analysis/CostModel/AArch64/gep.ll

test/Analysis/CostModel/X86/vector_gep.ll

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic