Diff 117572

include/llvm/Analysis/TargetTransformInfo.h

Show First 20 Lines • Show All 187 Lines • ▼ Show 20 Lines	public:
/// \brief Estimate the cost of a GEP operation when lowered.		/// \brief Estimate the cost of a GEP operation when lowered.
///		///
/// The contract for this function is the same as \c getOperationCost except		/// The contract for this function is the same as \c getOperationCost except
/// that it supports an interface that provides extra information specific to		/// that it supports an interface that provides extra information specific to
/// the GEP operation.		/// the GEP operation.
int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(Type PointeeType, const Value Ptr,
ArrayRef<const Value *> Operands) const;		ArrayRef<const Value *> Operands) const;

		/// \brief Estimate the cost of a GEP operation when lowered.
		///
		/// This user-based overload adds the ability to check if the GEP can be
		/// folded into its users.
		int getGEPCost(const GEPOperator *GEP,
		ArrayRef<const Value *> Operands) const;

/// \brief Estimate the cost of a EXT operation when lowered.		/// \brief Estimate the cost of a EXT operation when lowered.
///		///
/// The contract for this function is the same as \c getOperationCost except		/// The contract for this function is the same as \c getOperationCost except
/// that it supports an interface that provides extra information specific to		/// that it supports an interface that provides extra information specific to
/// the EXT operation.		/// the EXT operation.
int getExtCost(const Instruction I, const Value Src) const;		int getExtCost(const Instruction I, const Value Src) const;

/// \brief Estimate the cost of a function call when lowered.		/// \brief Estimate the cost of a function call when lowered.
▲ Show 20 Lines • Show All 41 Lines • ▼ Show 20 Lines	public:
/// \return The estimated number of case clusters when lowering \p 'SI'.		/// \return The estimated number of case clusters when lowering \p 'SI'.
/// \p JTSize Set a jump table size only when \p SI is suitable for a jump		/// \p JTSize Set a jump table size only when \p SI is suitable for a jump
/// table.		/// table.
unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI,		unsigned getEstimatedNumberOfCaseClusters(const SwitchInst &SI,
unsigned &JTSize) const;		unsigned &JTSize) const;

/// \brief Estimate the cost of a given IR user when lowered.		/// \brief Estimate the cost of a given IR user when lowered.
///		///
/// This can estimate the cost of either a ConstantExpr or Instruction when		/// This can estimate the cost of either a ConstantExpr or Instruction when
/// lowered. It has two primary advantages over the \c getOperationCost and		/// lowered. It has two primary advantages over the \c getOperationCost above,
		hfinkelUnsubmitted Done Reply Inline Actions This comment would need to be updated. hfinkel: This comment would need to be updated.
/// \c getGEPCost above, and one significant disadvantage: it can only be		/// and one significant disadvantage: it can only be used when the IR
/// used when the IR construct has already been formed.		/// construct has already been formed.
///		///
/// The advantages are that it can inspect the SSA use graph to reason more		/// The advantages are that it can inspect the SSA use graph to reason more
/// accurately about the cost. For example, all-constant-GEPs can often be		/// accurately about the cost. For example, all-constant-GEPs can often be
/// folded into a load or other instruction, but if they are used in some		/// folded into a load or other instruction, but if they are used in some
/// other context they may not be folded. This routine can distinguish such		/// other context they may not be folded. This routine can distinguish such
/// cases.		/// cases.
///		///
/// \p Operands is a list of operands which can be a result of transformations		/// \p Operands is a list of operands which can be a result of transformations
▲ Show 20 Lines • Show All 662 Lines • ▼ Show 20 Lines

class TargetTransformInfo::Concept {		class TargetTransformInfo::Concept {
public:		public:
virtual ~Concept() = 0;		virtual ~Concept() = 0;
virtual const DataLayout &getDataLayout() const = 0;		virtual const DataLayout &getDataLayout() const = 0;
virtual int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) = 0;		virtual int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) = 0;
virtual int getGEPCost(Type PointeeType, const Value Ptr,		virtual int getGEPCost(Type PointeeType, const Value Ptr,
ArrayRef<const Value *> Operands) = 0;		ArrayRef<const Value *> Operands) = 0;
		virtual int getGEPCost(const GEPOperator *GEP,
		ArrayRef<const Value *> Operands) = 0;
virtual int getExtCost(const Instruction I, const Value Src) = 0;		virtual int getExtCost(const Instruction I, const Value Src) = 0;
virtual int getCallCost(FunctionType *FTy, int NumArgs) = 0;		virtual int getCallCost(FunctionType *FTy, int NumArgs) = 0;
virtual int getCallCost(const Function *F, int NumArgs) = 0;		virtual int getCallCost(const Function *F, int NumArgs) = 0;
virtual int getCallCost(const Function *F,		virtual int getCallCost(const Function *F,
ArrayRef<const Value *> Arguments) = 0;		ArrayRef<const Value *> Arguments) = 0;
virtual unsigned getInliningThresholdMultiplier() = 0;		virtual unsigned getInliningThresholdMultiplier() = 0;
virtual int getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,		virtual int getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,
ArrayRef<Type *> ParamTys) = 0;		ArrayRef<Type *> ParamTys) = 0;
▲ Show 20 Lines • Show All 165 Lines • ▼ Show 20 Lines	public:

int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) override {		int getOperationCost(unsigned Opcode, Type Ty, Type OpTy) override {
return Impl.getOperationCost(Opcode, Ty, OpTy);		return Impl.getOperationCost(Opcode, Ty, OpTy);
}		}
int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(Type PointeeType, const Value Ptr,
ArrayRef<const Value *> Operands) override {		ArrayRef<const Value *> Operands) override {
return Impl.getGEPCost(PointeeType, Ptr, Operands);		return Impl.getGEPCost(PointeeType, Ptr, Operands);
}		}
		int getGEPCost(const GEPOperator *GEP,
		ArrayRef<const Value *> Operands) override {
		return Impl.getGEPCost(GEP, Operands);
		}
int getExtCost(const Instruction I, const Value Src) override {		int getExtCost(const Instruction I, const Value Src) override {
return Impl.getExtCost(I, Src);		return Impl.getExtCost(I, Src);
}		}
int getCallCost(FunctionType *FTy, int NumArgs) override {		int getCallCost(FunctionType *FTy, int NumArgs) override {
return Impl.getCallCost(FTy, NumArgs);		return Impl.getCallCost(FTy, NumArgs);
}		}
int getCallCost(const Function *F, int NumArgs) override {		int getCallCost(const Function *F, int NumArgs) override {
return Impl.getCallCost(F, NumArgs);		return Impl.getCallCost(F, NumArgs);
▲ Show 20 Lines • Show All 441 Lines • Show Last 20 Lines

include/llvm/Analysis/TargetTransformInfoImpl.h

Show First 20 Lines • Show All 46 Lines • ▼ Show 20 Lines	public:

unsigned getOperationCost(unsigned Opcode, Type Ty, Type OpTy) {		unsigned getOperationCost(unsigned Opcode, Type Ty, Type OpTy) {
switch (Opcode) {		switch (Opcode) {
default:		default:
// By default, just classify everything as 'basic'.		// By default, just classify everything as 'basic'.
return TTI::TCC_Basic;		return TTI::TCC_Basic;

case Instruction::GetElementPtr:		case Instruction::GetElementPtr:
llvm_unreachable("Use getGEPCost for GEP operations!");		llvm_unreachable("Use getGEPCost for GEP operations!");
		hfinkelUnsubmitted Not Done Reply Inline Actions This needs to be updated, or... At a high level, I'm not sure that we want to completely remove the version of the function that can be used without an existing function. Instead, we should add an overload, and then fall back to the existing code where relevant. hfinkel: This needs to be updated, or... At a high level, I'm not sure that we want to completely…
		junbumlAuthorUnsubmitted Not Done Reply Inline Actions I'm not perfectly clear about this. Do you think we should keep the existing getGEPCost as it is: int getGEPCost(Type *PointeeType, const Value *Ptr, ArrayRef<const Value *> Operands), and add the new one: int getGEPCost(const GEPOperator *GEP, ArrayRef<const Value *> Operands)? junbuml: I'm not perfectly clear about this. Do you think we should keep the existing getGEPCost as it…
		hfinkelUnsubmitted Done Reply Inline Actions Yes. Then implement this new function so that it calls the instruction-independent version to handle the non-user-based logic. hfinkel: Yes. Then implement this new function so that it calls the instruction-independent version to…

case Instruction::BitCast:		case Instruction::BitCast:
assert(OpTy && "Cast instructions must provide the operand type");		assert(OpTy && "Cast instructions must provide the operand type");
if (Ty == OpTy \|\| (Ty->isPointerTy() && OpTy->isPointerTy()))		if (Ty == OpTy \|\| (Ty->isPointerTy() && OpTy->isPointerTy()))
// Identity and pointer-to-pointer casts are free.		// Identity and pointer-to-pointer casts are free.
return TTI::TCC_Free;		return TTI::TCC_Free;

// Otherwise, the default basic cost is used.		// Otherwise, the default basic cost is used.
▲ Show 20 Lines • Show All 657 Lines • ▼ Show 20 Lines	int getGEPCost(Type PointeeType, const Value Ptr,
if (static_cast<T *>(this)->isLegalAddressingMode(		if (static_cast<T *>(this)->isLegalAddressingMode(
TargetType, const_cast<GlobalValue *>(BaseGV),		TargetType, const_cast<GlobalValue *>(BaseGV),
static_cast<int64_t>(BaseOffset.getLimitedValue()), HasBaseReg,		static_cast<int64_t>(BaseOffset.getLimitedValue()), HasBaseReg,
Scale, AS))		Scale, AS))
return TTI::TCC_Free;		return TTI::TCC_Free;
return TTI::TCC_Basic;		return TTI::TCC_Basic;
}		}

		int getGEPCost(const GEPOperator GEP, ArrayRef<const Value > Operands) {
		if (!isa<Instruction>(GEP))
		return TTI::TCC_Basic;

		Type *PointeeType = GEP->getSourceElementType();
		const Value *Ptr = GEP->getPointerOperand();

		if (getGEPCost(PointeeType, Ptr, Operands) == TTI::TCC_Free) {
		// Should check if the GEP is actually used in load / store instructions.
		// For simplicity, we check only direct users of the GEP.
		hfinkelUnsubmitted Done Reply Inline Actions togetehr -> together hfinkel: togetehr -> together
		//
		// FIXME: GEPs could also be folded away as a part of addressing mode in
		hfinkelUnsubmitted Not Done Reply Inline Actions I don't understand this comment. If there's a sext/zext, then it would be an operand of the GEP, not the other way around, no? hfinkel: I don't understand this comment. If there's a sext/zext, then it would be an operand of the GEP…
		junbumlAuthorUnsubmitted Not Done Reply Inline Actions Yes, sext must be an operand of the GEP, not a user. Sorry for the confusion. Remove "sext" from the comment. junbuml: Yes, sext must be an operand of the GEP, not a user. Sorry for the confusion. Remove "sext"…
		// load/store instructions together with other instructions (e.g., other
		// GEPs). Handling all such cases must be expensive to be performed
		// in this function, so we stay conservative for now.
		for (const User *U : GEP->users()) {
		const Operator *UOP = cast<Operator>(U);
		const Value *PointerOperand = nullptr;
		if (auto *LI = dyn_cast<LoadInst>(UOP))
		PointerOperand = LI->getPointerOperand();
		else if (auto *SI = dyn_cast<StoreInst>(UOP))
		PointerOperand = SI->getPointerOperand();

		if ((!PointerOperand \|\| PointerOperand != GEP) &&
		!GEP->hasAllZeroIndices())
		return TTI::TCC_Basic;
		}
		return TTI::TCC_Free;
		}
		return TTI::TCC_Basic;
		}

using BaseT::getIntrinsicCost;		using BaseT::getIntrinsicCost;

unsigned getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,		unsigned getIntrinsicCost(Intrinsic::ID IID, Type *RetTy,
ArrayRef<const Value *> Arguments) {		ArrayRef<const Value *> Arguments) {
// Delegate to the generic intrinsic handling code. This mostly provides an		// Delegate to the generic intrinsic handling code. This mostly provides an
// opportunity for targets to (for example) special case the cost of		// opportunity for targets to (for example) special case the cost of
// certain intrinsics based on constants used as arguments.		// certain intrinsics based on constants used as arguments.
SmallVector<Type *, 8> ParamTys;		SmallVector<Type *, 8> ParamTys;
ParamTys.reserve(Arguments.size());		ParamTys.reserve(Arguments.size());
for (unsigned Idx = 0, Size = Arguments.size(); Idx != Size; ++Idx)		for (unsigned Idx = 0, Size = Arguments.size(); Idx != Size; ++Idx)
ParamTys.push_back(Arguments[Idx]->getType());		ParamTys.push_back(Arguments[Idx]->getType());
return static_cast<T *>(this)->getIntrinsicCost(IID, RetTy, ParamTys);		return static_cast<T *>(this)->getIntrinsicCost(IID, RetTy, ParamTys);
}		}

unsigned getUserCost(const User U, ArrayRef<const Value > Operands) {		unsigned getUserCost(const User U, ArrayRef<const Value > Operands) {
if (isa<PHINode>(U))		if (isa<PHINode>(U))
return TTI::TCC_Free; // Model all PHI nodes as free.		return TTI::TCC_Free; // Model all PHI nodes as free.

// Static alloca doesn't generate target instructions.		// Static alloca doesn't generate target instructions.
if (auto *A = dyn_cast<AllocaInst>(U))		if (auto *A = dyn_cast<AllocaInst>(U))
if (A->isStaticAlloca())		if (A->isStaticAlloca())
return TTI::TCC_Free;		return TTI::TCC_Free;

if (const GEPOperator *GEP = dyn_cast<GEPOperator>(U)) {		if (const GEPOperator *GEP = dyn_cast<GEPOperator>(U))
return static_cast<T *>(this)->getGEPCost(GEP->getSourceElementType(),		return static_cast<T *>(this)->getGEPCost(GEP,
GEP->getPointerOperand(),
Operands.drop_front());		Operands.drop_front());
}

if (auto CS = ImmutableCallSite(U)) {		if (auto CS = ImmutableCallSite(U)) {
const Function *F = CS.getCalledFunction();		const Function *F = CS.getCalledFunction();
if (!F) {		if (!F) {
// Just use the called value type.		// Just use the called value type.
Type *FTy = CS.getCalledValue()->getType()->getPointerElementType();		Type *FTy = CS.getCalledValue()->getType()->getPointerElementType();
return static_cast<T *>(this)		return static_cast<T *>(this)
->getCallCost(cast<FunctionType>(FTy), CS.arg_size());		->getCallCost(cast<FunctionType>(FTy), CS.arg_size());
▲ Show 20 Lines • Show All 56 Lines • Show Last 20 Lines

include/llvm/CodeGen/BasicTTIImpl.h

Show First 20 Lines • Show All 183 Lines • ▼ Show 20 Lines	bool isTypeLegal(Type *Ty) {
return getTLI()->isTypeLegal(VT);		return getTLI()->isTypeLegal(VT);
}		}

int getGEPCost(Type PointeeType, const Value Ptr,		int getGEPCost(Type PointeeType, const Value Ptr,
ArrayRef<const Value *> Operands) {		ArrayRef<const Value *> Operands) {
return BaseT::getGEPCost(PointeeType, Ptr, Operands);		return BaseT::getGEPCost(PointeeType, Ptr, Operands);
}		}

		int getGEPCost(const GEPOperator *GEP,
		ArrayRef<const Value *> Operands) {
		return BaseT::getGEPCost(GEP, Operands);
		}

int getExtCost(const Instruction I, const Value Src) {		int getExtCost(const Instruction I, const Value Src) {
if (getTLI()->isExtFree(I))		if (getTLI()->isExtFree(I))
return TargetTransformInfo::TCC_Free;		return TargetTransformInfo::TCC_Free;

if (isa<ZExtInst>(I) \|\| isa<SExtInst>(I))		if (isa<ZExtInst>(I) \|\| isa<SExtInst>(I))
if (const LoadInst *LI = dyn_cast<LoadInst>(Src))		if (const LoadInst *LI = dyn_cast<LoadInst>(Src))
if (getTLI()->isExtLoad(LI, I, DL))		if (getTLI()->isExtLoad(LI, I, DL))
return TargetTransformInfo::TCC_Free;		return TargetTransformInfo::TCC_Free;
▲ Show 20 Lines • Show All 1,098 Lines • Show Last 20 Lines

include/llvm/IR/Operator.h

Show First 20 Lines • Show All 450 Lines • ▼ Show 20 Lines	public:
/// Return true if all of the indices of this GEP are zeros.		/// Return true if all of the indices of this GEP are zeros.
/// If so, the result pointer and the first operand have the same		/// If so, the result pointer and the first operand have the same
/// value, just potentially different types.		/// value, just potentially different types.
bool hasAllZeroIndices() const {		bool hasAllZeroIndices() const {
for (const_op_iterator I = idx_begin(), E = idx_end(); I != E; ++I) {		for (const_op_iterator I = idx_begin(), E = idx_end(); I != E; ++I) {
if (ConstantInt *C = dyn_cast<ConstantInt>(I))		if (ConstantInt *C = dyn_cast<ConstantInt>(I))
if (C->isZero())		if (C->isZero())
continue;		continue;
		if (isa<ConstantAggregateZero>(I))
		continue;
return false;		return false;
}		}
return true;		return true;
}		}

/// Return true if all of the indices of this GEP are constant integers.		/// Return true if all of the indices of this GEP are constant integers.
/// If so, the result pointer and the first operand have		/// If so, the result pointer and the first operand have
/// a constant offset between them.		/// a constant offset between them.
▲ Show 20 Lines • Show All 71 Lines • Show Last 20 Lines

lib/Analysis/TargetTransformInfo.cpp

Show First 20 Lines • Show All 82 Lines • ▼ Show 20 Lines	unsigned TargetTransformInfo::getInliningThresholdMultiplier() const {
return TTIImpl->getInliningThresholdMultiplier();		return TTIImpl->getInliningThresholdMultiplier();
}		}

int TargetTransformInfo::getGEPCost(Type PointeeType, const Value Ptr,		int TargetTransformInfo::getGEPCost(Type PointeeType, const Value Ptr,
ArrayRef<const Value *> Operands) const {		ArrayRef<const Value *> Operands) const {
return TTIImpl->getGEPCost(PointeeType, Ptr, Operands);		return TTIImpl->getGEPCost(PointeeType, Ptr, Operands);
}		}

		int TargetTransformInfo::getGEPCost(const GEPOperator *GEP,
		ArrayRef<const Value *> Operands) const {
		return TTIImpl->getGEPCost(GEP, Operands);
		}

int TargetTransformInfo::getExtCost(const Instruction *I,		int TargetTransformInfo::getExtCost(const Instruction *I,
const Value *Src) const {		const Value *Src) const {
return TTIImpl->getExtCost(I, Src);		return TTIImpl->getExtCost(I, Src);
}		}

int TargetTransformInfo::getIntrinsicCost(		int TargetTransformInfo::getIntrinsicCost(
Intrinsic::ID IID, Type RetTy, ArrayRef<const Value > Arguments) const {		Intrinsic::ID IID, Type RetTy, ArrayRef<const Value > Arguments) const {
int Cost = TTIImpl->getIntrinsicCost(IID, RetTy, Arguments);		int Cost = TTIImpl->getIntrinsicCost(IID, RetTy, Arguments);
▲ Show 20 Lines • Show All 1,097 Lines • Show Last 20 Lines

lib/Transforms/Scalar/NaryReassociate.cpp

Show First 20 Lines • Show All 258 Lines • ▼ Show 20 Lines	Instruction NaryReassociatePass::tryReassociate(Instruction I) {
}		}
}		}

static bool isGEPFoldable(GetElementPtrInst *GEP,		static bool isGEPFoldable(GetElementPtrInst *GEP,
const TargetTransformInfo *TTI) {		const TargetTransformInfo *TTI) {
SmallVector<const Value*, 4> Indices;		SmallVector<const Value*, 4> Indices;
for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)		for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)
Indices.push_back(*I);		Indices.push_back(*I);
return TTI->getGEPCost(GEP->getSourceElementType(), GEP->getPointerOperand(),		return TTI->getGEPCost(cast<GEPOperator>(GEP),
Indices) == TargetTransformInfo::TCC_Free;		Indices) == TargetTransformInfo::TCC_Free;
}		}

Instruction NaryReassociatePass::tryReassociateGEP(GetElementPtrInst GEP) {		Instruction NaryReassociatePass::tryReassociateGEP(GetElementPtrInst GEP) {
// Not worth reassociating GEP if it is foldable.		// Not worth reassociating GEP if it is foldable.
if (isGEPFoldable(GEP, TTI))		if (isGEPFoldable(GEP, TTI))
return nullptr;		return nullptr;

▲ Show 20 Lines • Show All 234 Lines • Show Last 20 Lines

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

Show First 20 Lines • Show All 233 Lines • ▼ Show 20 Lines	return (Basis.Ins != C.Ins && // skip the same instruction
Basis.CandidateKind == C.CandidateKind);		Basis.CandidateKind == C.CandidateKind);
}		}

static bool isGEPFoldable(GetElementPtrInst *GEP,		static bool isGEPFoldable(GetElementPtrInst *GEP,
const TargetTransformInfo *TTI) {		const TargetTransformInfo *TTI) {
SmallVector<const Value*, 4> Indices;		SmallVector<const Value*, 4> Indices;
for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)		for (auto I = GEP->idx_begin(); I != GEP->idx_end(); ++I)
Indices.push_back(*I);		Indices.push_back(*I);
return TTI->getGEPCost(GEP->getSourceElementType(), GEP->getPointerOperand(),		return TTI->getGEPCost(cast<GEPOperator>(GEP),
Indices) == TargetTransformInfo::TCC_Free;		Indices) == TargetTransformInfo::TCC_Free;
}		}

// Returns whether (Base + Index * Stride) can be folded to an addressing mode.		// Returns whether (Base + Index * Stride) can be folded to an addressing mode.
static bool isAddFoldable(const SCEV Base, ConstantInt Index, Value *Stride,		static bool isAddFoldable(const SCEV Base, ConstantInt Index, Value *Stride,
TargetTransformInfo *TTI) {		TargetTransformInfo *TTI) {
// Index->getSExtValue() may crash if Index is wider than 64-bit.		// Index->getSExtValue() may crash if Index is wider than 64-bit.
return Index->getBitWidth() <= 64 &&		return Index->getBitWidth() <= 64 &&
▲ Show 20 Lines • Show All 451 Lines • Show Last 20 Lines

test/Analysis/CostModel/AArch64/gep.ll

	Show First 20 Lines • Show All 284 Lines • ▼ Show 20 Lines

	define i64 @test36(i64* %p) {			define i64 @test36(i64* %p) {
	; CHECK-LABEL: test36			; CHECK-LABEL: test36
	; CHECK: cost of 1 for instruction: {{.}} getelementptr inbounds i64, i64			; CHECK: cost of 1 for instruction: {{.}} getelementptr inbounds i64, i64
	%a = getelementptr inbounds i64, i64* %p, i32 -512			%a = getelementptr inbounds i64, i64* %p, i32 -512
	%v = load i64, i64* %a			%v = load i64, i64* %a
	ret i64 %v			ret i64 %v
	}			}

				; CHECK-LABEL: test37
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test37(i64 %j, i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 %j
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL: test38
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test38(i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 10
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL:test39
				; CHECK: cost of 0 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test39(i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 0
				%l1 = call i8* @func(i8** %arrayidx0)
				ret i8 0
				}

				; CHECK-LABEL:test40
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8**
				define i8 @test40(i8 readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %P, i64 10
				ret i8** %arrayidx0
				}

				; CHECK-LABEL:test41
				; CHECK: cost of 1 for instruction: {{.}} = getelementptr inbounds i8, i8
				define i8 @test41(i8* %V, i8** readonly %P) {
				entry:
				%arrayidx0 = getelementptr inbounds i8, i8* %V, i64 10
				store i8* %arrayidx0, i8** %P
				ret i8 0
				}

				declare i8* @func(i8**)

test/Analysis/CostModel/X86/vector_gep.ll

	; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-linux-unknown-unknown -mattr=+avx512f \| FileCheck %s			; RUN: opt < %s -cost-model -analyze -mtriple=x86_64-linux-unknown-unknown -mattr=+avx512f \| FileCheck %s

	%struct.S = type { [1000 x i32] }			%struct.S = type { [1000 x i32] }


	declare <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*>, i32, <4 x i1>, <4 x i32>)			declare <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*>, i32, <4 x i1>, <4 x i32>)

	define <4 x i32> @foov(<4 x %struct.S*> %s, i64 %base){			define <4 x i32> @foov(<4 x %struct.S*> %s, i64 %base){
	%temp = insertelement <4 x i64> undef, i64 %base, i32 0			%temp = insertelement <4 x i64> undef, i64 %base, i32 0
	%vector = shufflevector <4 x i64> %temp, <4 x i64> undef, <4 x i32> zeroinitializer			%vector = shufflevector <4 x i64> %temp, <4 x i64> undef, <4 x i32> zeroinitializer
	;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds %struct.S			;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds %struct.S
				junbumlAuthorUnsubmitted Not Done Reply Inline Actions With this patch, %B becomes non-free because it is used in %arrayidx (a non-memory operation). It might be possible to continue checking the users of such non-memory-operation users, but doing this completely would be too expensive to do in getGEPCost. It might be possible to add some simple exceptions, but in this patch I didn't add such checks. junbuml: With this patch, %B becomes non-free because it is used in %arrayidx (a non-memory…
				efriedmaUnsubmitted Not Done Reply Inline Actions Yes, it should be fine to avoid folding together GEPs in getUserCost(). (Arguably, you might want to, but it could get complicated, so okay to skip that for now.) That said, there's something going wrong here. "gep %x, 0, 0" is free because it's just a type conversion. By the same reasoning, "gep %s, zeroinitializer, zeroinitializer" should also be free. efriedma: Yes, it should be fine to avoid folding together GEPs in getUserCost(). (Arguably, you might…
				junbumlAuthorUnsubmitted Not Done Reply Inline Actions We might be able to handle zeroinitializer in hasAllZeroIndices() for ArrayType. Then, I think it should be a separate patch. junbuml: We might be able to handle zeroinitializer in hasAllZeroIndices() for ArrayType. Then, I…
				hfinkelUnsubmitted Done Reply Inline Actions Why a separate patch? This patch is not overly complicated, and if there's a separate patch we'll have a regression in between. If you want to separate the patches, we should have them both before either is committed. But it sounds like a couple lines of code and a few lines of code for some tests. hfinkel: Why a separate patch? This patch is not overly complicated, and if there's a separate patch…
	%B = getelementptr inbounds %struct.S, <4 x %struct.S*> %s, <4 x i32> zeroinitializer, <4 x i32> zeroinitializer			%B = getelementptr inbounds %struct.S, <4 x %struct.S*> %s, <4 x i32> zeroinitializer, <4 x i32> zeroinitializer
	;CHECK: cost of 0 for instruction: {{.*}} getelementptr inbounds [1000 x i32]			;CHECK: cost of 1 for instruction: {{.*}} getelementptr inbounds [1000 x i32]
	%arrayidx = getelementptr inbounds [1000 x i32], <4 x [1000 x i32]*> %B, <4 x i64> zeroinitializer, <4 x i64> %vector			%arrayidx = getelementptr inbounds [1000 x i32], <4 x [1000 x i32]*> %B, <4 x i64> zeroinitializer, <4 x i64> %vector
	%res = call <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*> %arrayidx, i32 4, <4 x i1> <i1 true, i1 true, i1 true, i1 true>, <4 x i32> undef)			%res = call <4 x i32> @llvm.masked.gather.v4i32.v4p0i32(<4 x i32*> %arrayidx, i32 4, <4 x i1> <i1 true, i1 true, i1 true, i1 true>, <4 x i32> undef)
	ret <4 x i32> %res			ret <4 x i32> %res
	}			}

test/Transforms/SimplifyCFG/SpeculativeExecGepCE.ll

This file was added.

				; RUN: opt < %s -simplifycfg -phi-node-folding-threshold=0 -S \| FileCheck %s

				target triple = "x86_64-unknown-linux-gnu"

				@d_buf = internal constant [8 x i8] [i8 126, i8 127, i8 128, i8 129, i8 130, i8 131, i8 132, i8 133], align 8
				@a = internal constant { i8, i64} {i8 getelementptr inbounds ([8 x i8], [8 x i8]* @d_buf, i64 0, i64 0), i64 0}

				; CHECK-LABEL: @test
				; CHECK-LABEL: end:
				; CHECK: %x1 = phi i8*
				define i8* @test(i1* %dummy, i8* %a, i8* %b, i8 %v) {

				entry:
				%cond1 = load volatile i1, i1* %dummy
				br i1 %cond1, label %if, label %end

				if:
				%cond2 = load volatile i1, i1* %dummy
				br i1 %cond2, label %then, label %end

				then:
				br label %end

				end:
				%x1 = phi i8* [ %a, %entry ], [ %b, %if ], [getelementptr inbounds ([8 x i8], [8 x i8]* @d_buf, i64 0, i64 0) , %then ]

				ret i8* %x1
				}

This is an archive of the discontinued LLVM Phabricator instance.

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 117572

include/llvm/Analysis/TargetTransformInfo.h

include/llvm/Analysis/TargetTransformInfoImpl.h

include/llvm/CodeGen/BasicTTIImpl.h

include/llvm/IR/Operator.h

lib/Analysis/TargetTransformInfo.cpp

lib/Transforms/Scalar/NaryReassociate.cpp

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

test/Analysis/CostModel/AArch64/gep.ll

test/Analysis/CostModel/X86/vector_gep.ll

test/Transforms/SimplifyCFG/SpeculativeExecGepCE.ll

This is an archive of the discontinued LLVM Phabricator instance.

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 117572

include/llvm/Analysis/TargetTransformInfo.h

include/llvm/Analysis/TargetTransformInfoImpl.h

include/llvm/CodeGen/BasicTTIImpl.h

include/llvm/IR/Operator.h

lib/Analysis/TargetTransformInfo.cpp

lib/Transforms/Scalar/NaryReassociate.cpp

lib/Transforms/Scalar/StraightLineStrengthReduce.cpp

test/Analysis/CostModel/AArch64/gep.ll

test/Analysis/CostModel/X86/vector_gep.ll

test/Transforms/SimplifyCFG/SpeculativeExecGepCE.ll

Use the basic cost if a GEP is not used as addressing mode
ClosedPublic