Diff 343832

llvm/lib/Target/X86/X86.td

Show First 20 Lines • Show All 508 Lines • ▼ Show 20 Lines	: SubtargetFeature<
"fast-scalar-shift-masks", "HasFastScalarShiftMasks", "true",		"fast-scalar-shift-masks", "HasFastScalarShiftMasks", "true",
"Prefer a left/right scalar logical shift pair over a shift+and pair">;		"Prefer a left/right scalar logical shift pair over a shift+and pair">;

def FeatureFastVectorShiftMasks		def FeatureFastVectorShiftMasks
: SubtargetFeature<		: SubtargetFeature<
"fast-vector-shift-masks", "HasFastVectorShiftMasks", "true",		"fast-vector-shift-masks", "HasFastVectorShiftMasks", "true",
"Prefer a left/right vector logical shift pair over a shift+and pair">;		"Prefer a left/right vector logical shift pair over a shift+and pair">;

		def FeatureFastMOVBE
		: SubtargetFeature<"fast-movbe", "HasFastMOVBE", "true",
		"Prefer a movbe over a single-use load + bswap / single-use bswap + store">;
		RKSimon (done): You say 'prefer' - is there a future intention to alter isel depending on this? I'm not sure that's actually useful.
		lebedev.ri (author, done): > You say 'prefer' - is a future intention to alter isel depending on this? Not really. I was only interested in doing what is contained in this patch, i.e. modelling bswap as free in the cost model, if it will be free.
		RKSimon (done): I guess technically different codegen might still occur if the costs come out slightly different and the vectorizer 'prefers' scalar code - sorry for the noise.
		lebedev.ri (author, done): That wasn't noise. "Do you intend to prohibit formation of movbe if not HasFastMOVBE" seems like a good question. (I do not.)

def FeatureUseGLMDivSqrtCosts		def FeatureUseGLMDivSqrtCosts
: SubtargetFeature<"use-glm-div-sqrt-costs", "UseGLMDivSqrtCosts", "true",		: SubtargetFeature<"use-glm-div-sqrt-costs", "UseGLMDivSqrtCosts", "true",
"Use Goldmont specific floating point div/sqrt costs">;		"Use Goldmont specific floating point div/sqrt costs">;

// Enable use of alias analysis during code generation.		// Enable use of alias analysis during code generation.
def FeatureUseAA : SubtargetFeature<"use-aa", "UseAA", "true",		def FeatureUseAA : SubtargetFeature<"use-aa", "UseAA", "true",
"Use alias analysis during codegen">;		"Use alias analysis during codegen">;

▲ Show 20 Lines • Show All 290 Lines • ▼ Show 20 Lines	list<SubtargetFeature> SLMAdditionalFeatures = [FeatureSSE42,
FeatureRDRAND];		FeatureRDRAND];
list<SubtargetFeature> SLMTuning = [ProcIntelSLM,		list<SubtargetFeature> SLMTuning = [ProcIntelSLM,
FeatureSlowTwoMemOps,		FeatureSlowTwoMemOps,
FeatureSlowLEA,		FeatureSlowLEA,
FeatureSlowIncDec,		FeatureSlowIncDec,
FeatureSlowDivide64,		FeatureSlowDivide64,
FeatureSlowPMULLD,		FeatureSlowPMULLD,
FeatureFast7ByteNOP,		FeatureFast7ByteNOP,
		FeatureFastMOVBE,
FeaturePOPCNTFalseDeps,		FeaturePOPCNTFalseDeps,
FeatureInsertVZEROUPPER];		FeatureInsertVZEROUPPER];
list<SubtargetFeature> SLMFeatures =		list<SubtargetFeature> SLMFeatures =
!listconcat(AtomFeatures, SLMAdditionalFeatures);		!listconcat(AtomFeatures, SLMAdditionalFeatures);

// Goldmont		// Goldmont
list<SubtargetFeature> GLMAdditionalFeatures = [FeatureAES,		list<SubtargetFeature> GLMAdditionalFeatures = [FeatureAES,
FeatureSHA,		FeatureSHA,
FeatureRDSEED,		FeatureRDSEED,
FeatureXSAVE,		FeatureXSAVE,
FeatureXSAVEOPT,		FeatureXSAVEOPT,
FeatureXSAVEC,		FeatureXSAVEC,
FeatureXSAVES,		FeatureXSAVES,
FeatureCLFLUSHOPT,		FeatureCLFLUSHOPT,
FeatureFSGSBase];		FeatureFSGSBase];
list<SubtargetFeature> GLMTuning = [FeatureUseGLMDivSqrtCosts,		list<SubtargetFeature> GLMTuning = [FeatureUseGLMDivSqrtCosts,
FeatureSlowTwoMemOps,		FeatureSlowTwoMemOps,
FeatureSlowLEA,		FeatureSlowLEA,
FeatureSlowIncDec,		FeatureSlowIncDec,
		FeatureFastMOVBE,
FeaturePOPCNTFalseDeps,		FeaturePOPCNTFalseDeps,
FeatureInsertVZEROUPPER];		FeatureInsertVZEROUPPER];
list<SubtargetFeature> GLMFeatures =		list<SubtargetFeature> GLMFeatures =
!listconcat(SLMFeatures, GLMAdditionalFeatures);		!listconcat(SLMFeatures, GLMAdditionalFeatures);

// Goldmont Plus		// Goldmont Plus
list<SubtargetFeature> GLPAdditionalFeatures = [FeaturePTWRITE,		list<SubtargetFeature> GLPAdditionalFeatures = [FeaturePTWRITE,
FeatureRDPID];		FeatureRDPID];
list<SubtargetFeature> GLPTuning = [FeatureUseGLMDivSqrtCosts,		list<SubtargetFeature> GLPTuning = [FeatureUseGLMDivSqrtCosts,
FeatureSlowTwoMemOps,		FeatureSlowTwoMemOps,
FeatureSlowLEA,		FeatureSlowLEA,
FeatureSlowIncDec,		FeatureSlowIncDec,
		FeatureFastMOVBE,
FeatureInsertVZEROUPPER];		FeatureInsertVZEROUPPER];
list<SubtargetFeature> GLPFeatures =		list<SubtargetFeature> GLPFeatures =
!listconcat(GLMFeatures, GLPAdditionalFeatures);		!listconcat(GLMFeatures, GLPAdditionalFeatures);

// Tremont		// Tremont
list<SubtargetFeature> TRMAdditionalFeatures = [FeatureCLWB,		list<SubtargetFeature> TRMAdditionalFeatures = [FeatureCLWB,
FeatureGFNI];		FeatureGFNI];
list<SubtargetFeature> TRMTuning = GLPTuning;		list<SubtargetFeature> TRMTuning = GLPTuning;
▲ Show 20 Lines • Show All 57 Lines • ▼ Show 20 Lines	list<SubtargetFeature> KNLFeatures = [FeatureX87,
FeatureFMA,		FeatureFMA,
FeaturePRFCHW];		FeaturePRFCHW];
list<SubtargetFeature> KNLTuning = [FeatureSlowDivide64,		list<SubtargetFeature> KNLTuning = [FeatureSlowDivide64,
FeatureSlow3OpsLEA,		FeatureSlow3OpsLEA,
FeatureSlowIncDec,		FeatureSlowIncDec,
FeatureSlowTwoMemOps,		FeatureSlowTwoMemOps,
FeaturePreferMaskRegisters,		FeaturePreferMaskRegisters,
FeatureHasFastGather,		FeatureHasFastGather,
		FeatureFastMOVBE,
FeatureSlowPMADDWD];		FeatureSlowPMADDWD];
// TODO Add AVX5124FMAPS/AVX5124VNNIW features		// TODO Add AVX5124FMAPS/AVX5124VNNIW features
list<SubtargetFeature> KNMFeatures =		list<SubtargetFeature> KNMFeatures =
!listconcat(KNLFeatures, [FeatureVPOPCNTDQ]);		!listconcat(KNLFeatures, [FeatureVPOPCNTDQ]);

// Barcelona		// Barcelona
list<SubtargetFeature> BarcelonaFeatures = [FeatureX87,		list<SubtargetFeature> BarcelonaFeatures = [FeatureX87,
FeatureCMPXCHG8B,		FeatureCMPXCHG8B,
▲ Show 20 Lines • Show All 43 Lines • ▼ Show 20 Lines	list<SubtargetFeature> BtVer2AdditionalFeatures = [FeatureAVX,
FeatureXSAVE,		FeatureXSAVE,
FeatureXSAVEOPT];		FeatureXSAVEOPT];
list<SubtargetFeature> BtVer2Tuning = [FeatureFastLZCNT,		list<SubtargetFeature> BtVer2Tuning = [FeatureFastLZCNT,
FeatureFastBEXTR,		FeatureFastBEXTR,
FeatureFastHorizontalOps,		FeatureFastHorizontalOps,
FeatureFast15ByteNOP,		FeatureFast15ByteNOP,
FeatureFastScalarShiftMasks,		FeatureFastScalarShiftMasks,
FeatureFastVectorShiftMasks,		FeatureFastVectorShiftMasks,
		FeatureFastMOVBE,
FeatureSlowSHLD];		FeatureSlowSHLD];
list<SubtargetFeature> BtVer2Features =		list<SubtargetFeature> BtVer2Features =
!listconcat(BtVer1Features, BtVer2AdditionalFeatures);		!listconcat(BtVer1Features, BtVer2AdditionalFeatures);

// Bulldozer		// Bulldozer
list<SubtargetFeature> BdVer1Features = [FeatureX87,		list<SubtargetFeature> BdVer1Features = [FeatureX87,
FeatureCMPXCHG8B,		FeatureCMPXCHG8B,
FeatureCMOV,		FeatureCMOV,
Show All 18 Lines	list<SubtargetFeature> BdVer1Tuning = [FeatureSlowSHLD,
FeatureInsertVZEROUPPER];		FeatureInsertVZEROUPPER];

// PileDriver		// PileDriver
list<SubtargetFeature> BdVer2AdditionalFeatures = [FeatureF16C,		list<SubtargetFeature> BdVer2AdditionalFeatures = [FeatureF16C,
FeatureBMI,		FeatureBMI,
FeatureTBM,		FeatureTBM,
FeatureFMA,		FeatureFMA,
FeatureFastBEXTR];		FeatureFastBEXTR];
list<SubtargetFeature> BdVer2Tuning = BdVer1Tuning;		list<SubtargetFeature> BdVer2AdditionalTuning = [FeatureFastMOVBE];
		list<SubtargetFeature> BdVer2Tuning =
		!listconcat(BdVer1Tuning, BdVer2AdditionalTuning);
list<SubtargetFeature> BdVer2Features =		list<SubtargetFeature> BdVer2Features =
!listconcat(BdVer1Features, BdVer2AdditionalFeatures);		!listconcat(BdVer1Features, BdVer2AdditionalFeatures);

// Steamroller		// Steamroller
list<SubtargetFeature> BdVer3AdditionalFeatures = [FeatureXSAVEOPT,		list<SubtargetFeature> BdVer3AdditionalFeatures = [FeatureXSAVEOPT,
FeatureFSGSBase];		FeatureFSGSBase];
list<SubtargetFeature> BdVer3Tuning = BdVer2Tuning;		list<SubtargetFeature> BdVer3Tuning = BdVer2Tuning;
list<SubtargetFeature> BdVer3Features =		list<SubtargetFeature> BdVer3Features =
▲ Show 20 Lines • Show All 43 Lines • ▼ Show 20 Lines	list<SubtargetFeature> ZNFeatures = [FeatureADX,
FeatureXSAVEC,		FeatureXSAVEC,
FeatureXSAVEOPT,		FeatureXSAVEOPT,
FeatureXSAVES];		FeatureXSAVES];
list<SubtargetFeature> ZNTuning = [FeatureFastLZCNT,		list<SubtargetFeature> ZNTuning = [FeatureFastLZCNT,
FeatureFastBEXTR,		FeatureFastBEXTR,
FeatureFast15ByteNOP,		FeatureFast15ByteNOP,
FeatureBranchFusion,		FeatureBranchFusion,
FeatureFastScalarShiftMasks,		FeatureFastScalarShiftMasks,
		FeatureFastMOVBE,
FeatureSlowSHLD,		FeatureSlowSHLD,
FeatureInsertVZEROUPPER];		FeatureInsertVZEROUPPER];
list<SubtargetFeature> ZN2AdditionalFeatures = [FeatureCLWB,		list<SubtargetFeature> ZN2AdditionalFeatures = [FeatureCLWB,
FeatureRDPID,		FeatureRDPID,
FeatureWBNOINVD];		FeatureWBNOINVD];
list<SubtargetFeature> ZN2Tuning = ZNTuning;		list<SubtargetFeature> ZN2Tuning = ZNTuning;
list<SubtargetFeature> ZN2Features =		list<SubtargetFeature> ZN2Features =
!listconcat(ZNFeatures, ZN2AdditionalFeatures);		!listconcat(ZNFeatures, ZN2AdditionalFeatures);
▲ Show 20 Lines • Show All 408 Lines • Show Last 20 Lines

llvm/lib/Target/X86/X86Subtarget.h

Show First 20 Lines • Show All 427 Lines • ▼ Show 20 Lines	class X86Subtarget final : public X86GenSubtargetInfo {
bool HasFastHorizontalOps = false;		bool HasFastHorizontalOps = false;

/// Prefer a left/right scalar logical shifts pair over a shift+and pair.		/// Prefer a left/right scalar logical shifts pair over a shift+and pair.
bool HasFastScalarShiftMasks = false;		bool HasFastScalarShiftMasks = false;

/// Prefer a left/right vector logical shifts pair over a shift+and pair.		/// Prefer a left/right vector logical shifts pair over a shift+and pair.
bool HasFastVectorShiftMasks = false;		bool HasFastVectorShiftMasks = false;

		/// Prefer a movbe over a single-use load + bswap / single-use bswap + store.
		bool HasFastMOVBE = false;

/// Use a retpoline thunk rather than indirect calls to block speculative		/// Use a retpoline thunk rather than indirect calls to block speculative
/// execution.		/// execution.
bool UseRetpolineIndirectCalls = false;		bool UseRetpolineIndirectCalls = false;

/// Use a retpoline thunk or remove any indirect branch to block speculative		/// Use a retpoline thunk or remove any indirect branch to block speculative
/// execution.		/// execution.
bool UseRetpolineIndirectBranches = false;		bool UseRetpolineIndirectBranches = false;

▲ Show 20 Lines • Show All 265 Lines • ▼ Show 20 Lines	public:
bool hasFastScalarFSQRT() const { return HasFastScalarFSQRT; }		bool hasFastScalarFSQRT() const { return HasFastScalarFSQRT; }
bool hasFastVectorFSQRT() const { return HasFastVectorFSQRT; }		bool hasFastVectorFSQRT() const { return HasFastVectorFSQRT; }
bool hasFastLZCNT() const { return HasFastLZCNT; }		bool hasFastLZCNT() const { return HasFastLZCNT; }
bool hasFastSHLDRotate() const { return HasFastSHLDRotate; }		bool hasFastSHLDRotate() const { return HasFastSHLDRotate; }
bool hasFastBEXTR() const { return HasFastBEXTR; }		bool hasFastBEXTR() const { return HasFastBEXTR; }
bool hasFastHorizontalOps() const { return HasFastHorizontalOps; }		bool hasFastHorizontalOps() const { return HasFastHorizontalOps; }
bool hasFastScalarShiftMasks() const { return HasFastScalarShiftMasks; }		bool hasFastScalarShiftMasks() const { return HasFastScalarShiftMasks; }
bool hasFastVectorShiftMasks() const { return HasFastVectorShiftMasks; }		bool hasFastVectorShiftMasks() const { return HasFastVectorShiftMasks; }
		bool hasFastMOVBE() const { return HasFastMOVBE; }
bool hasMacroFusion() const { return HasMacroFusion; }		bool hasMacroFusion() const { return HasMacroFusion; }
bool hasBranchFusion() const { return HasBranchFusion; }		bool hasBranchFusion() const { return HasBranchFusion; }
bool hasERMSB() const { return HasERMSB; }		bool hasERMSB() const { return HasERMSB; }
bool hasFSRM() const { return HasFSRM; }		bool hasFSRM() const { return HasFSRM; }
bool hasSlowDivide32() const { return HasSlowDivide32; }		bool hasSlowDivide32() const { return HasSlowDivide32; }
bool hasSlowDivide64() const { return HasSlowDivide64; }		bool hasSlowDivide64() const { return HasSlowDivide64; }
bool padShortFunctions() const { return PadShortFunctions; }		bool padShortFunctions() const { return PadShortFunctions; }
bool slowTwoMemOps() const { return SlowTwoMemOps; }		bool slowTwoMemOps() const { return SlowTwoMemOps; }
▲ Show 20 Lines • Show All 225 Lines • Show Last 20 Lines

llvm/lib/Target/X86/X86TargetTransformInfo.cpp

Show First 20 Lines • Show All 2,689 Lines • ▼ Show 20 Lines	X86TTIImpl::getTypeBasedIntrinsicInstrCost(const IntrinsicCostAttributes &ICA,
static const CostTblEntry POPCNT32CostTbl[] = { // 32 or 64-bit targets		static const CostTblEntry POPCNT32CostTbl[] = { // 32 or 64-bit targets
{ ISD::CTPOP, MVT::i32, 1 },		{ ISD::CTPOP, MVT::i32, 1 },
{ ISD::CTPOP, MVT::i16, 1 },		{ ISD::CTPOP, MVT::i16, 1 },
{ ISD::CTPOP, MVT::i8, 1 },		{ ISD::CTPOP, MVT::i8, 1 },
};		};
static const CostTblEntry X64CostTbl[] = { // 64-bit targets		static const CostTblEntry X64CostTbl[] = { // 64-bit targets
{ ISD::ABS, MVT::i64, 2 }, // SUB+CMOV		{ ISD::ABS, MVT::i64, 2 }, // SUB+CMOV
{ ISD::BITREVERSE, MVT::i64, 14 },		{ ISD::BITREVERSE, MVT::i64, 14 },
		{ ISD::BSWAP, MVT::i64, 1 },
{ ISD::CTLZ, MVT::i64, 4 }, // BSR+XOR or BSR+XOR+CMOV		{ ISD::CTLZ, MVT::i64, 4 }, // BSR+XOR or BSR+XOR+CMOV
{ ISD::CTTZ, MVT::i64, 3 }, // TEST+BSF+CMOV/BRANCH		{ ISD::CTTZ, MVT::i64, 3 }, // TEST+BSF+CMOV/BRANCH
{ ISD::CTPOP, MVT::i64, 10 },		{ ISD::CTPOP, MVT::i64, 10 },
{ ISD::SADDO, MVT::i64, 1 },		{ ISD::SADDO, MVT::i64, 1 },
{ ISD::UADDO, MVT::i64, 1 },		{ ISD::UADDO, MVT::i64, 1 },
{ ISD::UMULO, MVT::i64, 2 }, // mulq + seto		{ ISD::UMULO, MVT::i64, 2 }, // mulq + seto
};		};
static const CostTblEntry X86CostTbl[] = { // 32 or 64-bit targets		static const CostTblEntry X86CostTbl[] = { // 32 or 64-bit targets
{ ISD::ABS, MVT::i32, 2 }, // SUB+CMOV		{ ISD::ABS, MVT::i32, 2 }, // SUB+CMOV
{ ISD::ABS, MVT::i16, 2 }, // SUB+CMOV		{ ISD::ABS, MVT::i16, 2 }, // SUB+CMOV
{ ISD::BITREVERSE, MVT::i32, 14 },		{ ISD::BITREVERSE, MVT::i32, 14 },
{ ISD::BITREVERSE, MVT::i16, 14 },		{ ISD::BITREVERSE, MVT::i16, 14 },
{ ISD::BITREVERSE, MVT::i8, 11 },		{ ISD::BITREVERSE, MVT::i8, 11 },
		{ ISD::BSWAP, MVT::i32, 1 },
		{ ISD::BSWAP, MVT::i16, 1 }, // ROL
{ ISD::CTLZ, MVT::i32, 4 }, // BSR+XOR or BSR+XOR+CMOV		{ ISD::CTLZ, MVT::i32, 4 }, // BSR+XOR or BSR+XOR+CMOV
{ ISD::CTLZ, MVT::i16, 4 }, // BSR+XOR or BSR+XOR+CMOV		{ ISD::CTLZ, MVT::i16, 4 }, // BSR+XOR or BSR+XOR+CMOV
{ ISD::CTLZ, MVT::i8, 4 }, // BSR+XOR or BSR+XOR+CMOV		{ ISD::CTLZ, MVT::i8, 4 }, // BSR+XOR or BSR+XOR+CMOV
{ ISD::CTTZ, MVT::i32, 3 }, // TEST+BSF+CMOV/BRANCH		{ ISD::CTTZ, MVT::i32, 3 }, // TEST+BSF+CMOV/BRANCH
{ ISD::CTTZ, MVT::i16, 3 }, // TEST+BSF+CMOV/BRANCH		{ ISD::CTTZ, MVT::i16, 3 }, // TEST+BSF+CMOV/BRANCH
{ ISD::CTTZ, MVT::i8, 3 }, // TEST+BSF+CMOV/BRANCH		{ ISD::CTTZ, MVT::i8, 3 }, // TEST+BSF+CMOV/BRANCH
{ ISD::CTPOP, MVT::i32, 8 },		{ ISD::CTPOP, MVT::i32, 8 },
{ ISD::CTPOP, MVT::i16, 9 },		{ ISD::CTPOP, MVT::i16, 9 },
▲ Show 20 Lines • Show All 195 Lines • ▼ Show 20 Lines	if (ST->hasPOPCNT()) {
if (ST->is64Bit())		if (ST->is64Bit())
if (const auto *Entry = CostTableLookup(POPCNT64CostTbl, ISD, MTy))		if (const auto *Entry = CostTableLookup(POPCNT64CostTbl, ISD, MTy))
return adjustTableCost(*Entry, LT.first, ICA.getFlags());		return adjustTableCost(*Entry, LT.first, ICA.getFlags());

if (const auto *Entry = CostTableLookup(POPCNT32CostTbl, ISD, MTy))		if (const auto *Entry = CostTableLookup(POPCNT32CostTbl, ISD, MTy))
return adjustTableCost(*Entry, LT.first, ICA.getFlags());		return adjustTableCost(*Entry, LT.first, ICA.getFlags());
}		}

		if (ISD == ISD::BSWAP && ST->hasMOVBE() && ST->hasFastMOVBE()) {
		if (const Instruction *II = ICA.getInst()) {
		if (II->hasOneUse() && isa<StoreInst>(II->user_back()))
		craig.topper (done): At least on Intel Core CPUs, MOVBE isn't optimized. It's a load or store and a bswap operation. Maybe it's optimized on Atom/Silvermont/Goldmont? It was added to that line of CPUs first, possibly because those CPUs have been used in networking equipment.
		lebedev.ri (author, done): Looking at actual AMD Zen3 measurements, `movbe r<-m` is `1` uop, while `movbe m<-r` is `2`, which is actually a regression from Zen2/Zen1, as per https://www.agner.org/optimize/instruction_tables.pdf. As per that table, both are really slow on Haswell/Broadwell/Skylake, but fast on Silvermont/Goldmont/KNL. So I think we could mark `movbe r<-m` on AMD's at least.
		lebedev.ri (author, done): So I think we could mark `movbe r<-m` as free on AMD's at least.
		return TTI::TCC_Free;
		if (auto *LI = dyn_cast<LoadInst>(II->getOperand(0))) {
		if (LI->hasOneUse())
		return TTI::TCC_Free;
		}
		}
		}

// TODO - add BMI (TZCNT) scalar handling		// TODO - add BMI (TZCNT) scalar handling

if (ST->is64Bit())		if (ST->is64Bit())
if (const auto *Entry = CostTableLookup(X64CostTbl, ISD, MTy))		if (const auto *Entry = CostTableLookup(X64CostTbl, ISD, MTy))
return adjustTableCost(*Entry, LT.first, ICA.getFlags());		return adjustTableCost(*Entry, LT.first, ICA.getFlags());

if (const auto *Entry = CostTableLookup(X86CostTbl, ISD, MTy))		if (const auto *Entry = CostTableLookup(X86CostTbl, ISD, MTy))
return adjustTableCost(*Entry, LT.first, ICA.getFlags());		return adjustTableCost(*Entry, LT.first, ICA.getFlags());
▲ Show 20 Lines • Show All 1,894 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/X86/bswap-store.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X64
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X64-MOVBE
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X86			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe,+fast-movbe \| FileCheck %s --check-prefixes=ALL,X64-FASTMOVBE
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X86
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X32
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X32-MOVBE
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe,+fast-movbe \| FileCheck %s --check-prefixes=ALL,X32-FASTMOVBE

	declare i16 @llvm.bswap.i16(i16)			declare i16 @llvm.bswap.i16(i16)
	declare i32 @llvm.bswap.i32(i32)			declare i32 @llvm.bswap.i32(i32)
	declare i64 @llvm.bswap.i64(i64)			declare i64 @llvm.bswap.i64(i64)
	declare i128 @llvm.bswap.i128(i128)			declare i128 @llvm.bswap.i128(i128)

	define void @var_bswap_store_i16(i16 %a, i16* %dst) {			define void @var_bswap_store_i16(i16 %a, i16* %dst) {
	; NOMOVBE-LABEL: 'var_bswap_store_i16'			; X64-LABEL: 'var_bswap_store_i16'
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	; MOVBE-LABEL: 'var_bswap_store_i16'			; X64-MOVBE-LABEL: 'var_bswap_store_i16'
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i16'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i16'
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i16'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i16'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i16 @llvm.bswap.i16(i16 %a)			%bswap = call i16 @llvm.bswap.i16(i16 %a)
	store i16 %bswap, i16* %dst, align 1			store i16 %bswap, i16* %dst, align 1

	ret void			ret void
	}			}
	define void @var_bswap_store_i16_extrause(i16 %a, i16* %dst) {			define void @var_bswap_store_i16_extrause(i16 %a, i16* %dst) {
	; NOMOVBE-LABEL: 'var_bswap_store_i16_extrause'			; ALL-LABEL: 'var_bswap_store_i16_extrause'
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i16 %bswap, 2			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i16 %bswap, 2
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;
	; MOVBE-LABEL: 'var_bswap_store_i16_extrause'
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %bswap, i16* %dst, align 1
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i16 %bswap, 2
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i16 @llvm.bswap.i16(i16 %a)			%bswap = call i16 @llvm.bswap.i16(i16 %a)
	store i16 %bswap, i16* %dst, align 1			store i16 %bswap, i16* %dst, align 1

	%bswap2 = shl i16 %bswap, 2 ; incur an extra use to the bswap			%bswap2 = shl i16 %bswap, 2 ; incur an extra use to the bswap

	ret void			ret void
	}			}

	define void @var_bswap_store_i32(i32 %a, i32* %dst) {			define void @var_bswap_store_i32(i32 %a, i32* %dst) {
	; ALL-LABEL: 'var_bswap_store_i32'			; X64-LABEL: 'var_bswap_store_i32'
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
	; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-MOVBE-LABEL: 'var_bswap_store_i32'
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i32'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i32'
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i32'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i32'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i32 @llvm.bswap.i32(i32 %a)			%bswap = call i32 @llvm.bswap.i32(i32 %a)
	store i32 %bswap, i32* %dst, align 1			store i32 %bswap, i32* %dst, align 1

	ret void			ret void
	}			}
	define void @var_bswap_store_i32_extrause(i32 %a, i32* %dst) {			define void @var_bswap_store_i32_extrause(i32 %a, i32* %dst) {
	; ALL-LABEL: 'var_bswap_store_i32_extrause'			; ALL-LABEL: 'var_bswap_store_i32_extrause'
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i32 %bswap, i32* %dst, align 1
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i32 %bswap, 2			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i32 %bswap, 2
	; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i32 @llvm.bswap.i32(i32 %a)			%bswap = call i32 @llvm.bswap.i32(i32 %a)
	store i32 %bswap, i32* %dst, align 1			store i32 %bswap, i32* %dst, align 1

	%bswap2 = shl i32 %bswap, 2 ; incur an extra use to the bswap			%bswap2 = shl i32 %bswap, 2 ; incur an extra use to the bswap

	ret void			ret void
	}			}

	define void @var_bswap_store_i64(i64 %a, i64* %dst) {			define void @var_bswap_store_i64(i64 %a, i64* %dst) {
	; X64-LABEL: 'var_bswap_store_i64'			; X64-LABEL: 'var_bswap_store_i64'
	craig.topper (not done): These check lines vanished and were not replaced.
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	; X86-LABEL: 'var_bswap_store_i64'			; X64-MOVBE-LABEL: 'var_bswap_store_i64'
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i64'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i64'
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i64'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i64'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i64 @llvm.bswap.i64(i64 %a)			%bswap = call i64 @llvm.bswap.i64(i64 %a)
	store i64 %bswap, i64* %dst, align 1			store i64 %bswap, i64* %dst, align 1

	ret void			ret void
	}			}
	define void @var_bswap_store_i64_extrause(i64 %a, i64* %dst) {			define void @var_bswap_store_i64_extrause(i64 %a, i64* %dst) {
	; X64-LABEL: 'var_bswap_store_i64_extrause'			; X64-LABEL: 'var_bswap_store_i64_extrause'
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i64 %bswap, 2			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i64 %bswap, 2
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	; X86-LABEL: 'var_bswap_store_i64_extrause'			; X64-MOVBE-LABEL: 'var_bswap_store_i64_extrause'
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i64 %bswap, 2			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i64 %bswap, 2
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i64_extrause'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %bswap, i64* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap2 = shl i64 %bswap, 2
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i64_extrause'
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i64 %bswap, 2
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i64_extrause'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i64 %bswap, 2
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i64_extrause'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %bswap, i64* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i64 %bswap, 2
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i64 @llvm.bswap.i64(i64 %a)			%bswap = call i64 @llvm.bswap.i64(i64 %a)
	store i64 %bswap, i64* %dst, align 1			store i64 %bswap, i64* %dst, align 1

	%bswap2 = shl i64 %bswap, 2 ; incur an extra use to the bswap			%bswap2 = shl i64 %bswap, 2 ; incur an extra use to the bswap

	ret void			ret void
	}			}

	define void @var_bswap_store_i128(i128 %a, i128* %dst) {			define void @var_bswap_store_i128(i128 %a, i128* %dst) {
	; X64-LABEL: 'var_bswap_store_i128'			; X64-LABEL: 'var_bswap_store_i128'
	craig.topper: Same here.
	; X64-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	; X86-LABEL: 'var_bswap_store_i128'			; X64-MOVBE-LABEL: 'var_bswap_store_i128'
	; X86-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i128'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i128'
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i128'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i128'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i128 @llvm.bswap.i128(i128 %a)			%bswap = call i128 @llvm.bswap.i128(i128 %a)
	store i128 %bswap, i128* %dst, align 1			store i128 %bswap, i128* %dst, align 1

	ret void			ret void
	}			}
	define void @var_bswap_store_i128_extrause(i128 %a, i128* %dst) {			define void @var_bswap_store_i128_extrause(i128 %a, i128* %dst) {
	; X64-LABEL: 'var_bswap_store_i128_extrause'			; X64-LABEL: 'var_bswap_store_i128_extrause'
	; X64-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i128 %bswap, 2			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i128 %bswap, 2
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	; X86-LABEL: 'var_bswap_store_i128_extrause'			; X64-MOVBE-LABEL: 'var_bswap_store_i128_extrause'
	; X86-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap2 = shl i128 %bswap, 2			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i128 %bswap, 2
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X64-FASTMOVBE-LABEL: 'var_bswap_store_i128_extrause'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %bswap, i128* %dst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap2 = shl i128 %bswap, 2
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-LABEL: 'var_bswap_store_i128_extrause'
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap2 = shl i128 %bswap, 2
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-MOVBE-LABEL: 'var_bswap_store_i128_extrause'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap2 = shl i128 %bswap, 2
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
				;
				; X32-FASTMOVBE-LABEL: 'var_bswap_store_i128_extrause'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %bswap, i128* %dst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap2 = shl i128 %bswap, 2
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret void
	;			;
	%bswap = call i128 @llvm.bswap.i128(i128 %a)			%bswap = call i128 @llvm.bswap.i128(i128 %a)
	store i128 %bswap, i128* %dst, align 1			store i128 %bswap, i128* %dst, align 1

	%bswap2 = shl i128 %bswap, 2 ; incur an extra use to the bswap			%bswap2 = shl i128 %bswap, 2 ; incur an extra use to the bswap

	ret void			ret void
	}			}

llvm/test/Analysis/CostModel/X86/bswap.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X64
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X64
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X86			; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X86
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X86			; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X86

	declare i16 @llvm.bswap.i16(i16)			declare i16 @llvm.bswap.i16(i16)
	declare i32 @llvm.bswap.i32(i32)			declare i32 @llvm.bswap.i32(i32)
	declare i64 @llvm.bswap.i64(i64)			declare i64 @llvm.bswap.i64(i64)
	declare i128 @llvm.bswap.i128(i128)			declare i128 @llvm.bswap.i128(i128)

	; Verify the cost of scalar bswap instructions.			; Verify the cost of scalar bswap instructions.

	define i16 @var_bswap_i16(i16 %a) {			define i16 @var_bswap_i16(i16 %a) {
	; NOMOVBE-LABEL: 'var_bswap_i16'			; ALL-LABEL: 'var_bswap_i16'
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap			; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;
	; MOVBE-LABEL: 'var_bswap_i16'
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;			;
	%bswap = call i16 @llvm.bswap.i16(i16 %a)			%bswap = call i16 @llvm.bswap.i16(i16 %a)
	ret i16 %bswap			ret i16 %bswap
	}			}

	define i32 @var_bswap_i32(i32 %a) {			define i32 @var_bswap_i32(i32 %a) {
	; ALL-LABEL: 'var_bswap_i32'			; ALL-LABEL: 'var_bswap_i32'
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
	; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap			; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
	;			;
	%bswap = call i32 @llvm.bswap.i32(i32 %a)			%bswap = call i32 @llvm.bswap.i32(i32 %a)
	ret i32 %bswap			ret i32 %bswap
	}			}

	define i64 @var_bswap_i64(i64 %a) {			define i64 @var_bswap_i64(i64 %a) {
	; X64-LABEL: 'var_bswap_i64'			; X64-LABEL: 'var_bswap_i64'
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	; X86-LABEL: 'var_bswap_i64'			; X86-LABEL: 'var_bswap_i64'
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	%bswap = call i64 @llvm.bswap.i64(i64 %a)			%bswap = call i64 @llvm.bswap.i64(i64 %a)
	ret i64 %bswap			ret i64 %bswap
	}			}

	define i128 @var_bswap_i128(i128 %a) {			define i128 @var_bswap_i128(i128 %a) {
	; X64-LABEL: 'var_bswap_i128'			; X64-LABEL: 'var_bswap_i128'
	; X64-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	; X86-LABEL: 'var_bswap_i128'			; X86-LABEL: 'var_bswap_i128'
	; X86-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	%bswap = call i128 @llvm.bswap.i128(i128 %a)			%bswap = call i128 @llvm.bswap.i128(i128 %a)
	ret i128 %bswap			ret i128 %bswap
	}			}

llvm/test/Analysis/CostModel/X86/load-bswap.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X64
	; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X64			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X64-MOVBE
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,NOMOVBE,X86			; RUN: opt < %s -mtriple=x86_64-unknown-linux-gnu -cost-model -analyze -mattr=+movbe,+fast-movbe \| FileCheck %s --check-prefixes=ALL,X64-FASTMOVBE
	; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,MOVBE,X86
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze \| FileCheck %s --check-prefixes=ALL,X32
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe \| FileCheck %s --check-prefixes=ALL,X32-MOVBE
				; RUN: opt < %s -mtriple=i686-unknown-linux-gnu -cost-model -analyze -mattr=+movbe,+fast-movbe \| FileCheck %s --check-prefixes=ALL,X32-FASTMOVBE

	declare i16 @llvm.bswap.i16(i16)			declare i16 @llvm.bswap.i16(i16)
	declare i32 @llvm.bswap.i32(i32)			declare i32 @llvm.bswap.i32(i32)
	declare i64 @llvm.bswap.i64(i64)			declare i64 @llvm.bswap.i64(i64)
	declare i128 @llvm.bswap.i128(i128)			declare i128 @llvm.bswap.i128(i128)

	define i16 @var_load_bswap_i16(i16* %src) {			define i16 @var_load_bswap_i16(i16* %src) {
	; NOMOVBE-LABEL: 'var_load_bswap_i16'			; X64-LABEL: 'var_load_bswap_i16'
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;			;
	; MOVBE-LABEL: 'var_load_bswap_i16'			; X64-MOVBE-LABEL: 'var_load_bswap_i16'
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i16'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i16'
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i16'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i16'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;			;
	%a = load i16, i16* %src, align 1			%a = load i16, i16* %src, align 1
	%bswap = call i16 @llvm.bswap.i16(i16 %a)			%bswap = call i16 @llvm.bswap.i16(i16 %a)

	ret i16 %bswap			ret i16 %bswap
	}			}
	define i16 @var_load_bswap_i16_extrause(i16* %src, i16* %clobberdst) {			define i16 @var_load_bswap_i16_extrause(i16* %src, i16* %clobberdst) {
	; NOMOVBE-LABEL: 'var_load_bswap_i16_extrause'			; ALL-LABEL: 'var_load_bswap_i16_extrause'
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 10 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i16 %a, 2			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i16 %a, 2
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %a2, i16* %clobberdst, align 1			; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %a2, i16* %clobberdst, align 1
	; NOMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap			; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;
	; MOVBE-LABEL: 'var_load_bswap_i16_extrause'
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i16, i16* %src, align 1
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i16 @llvm.bswap.i16(i16 %a)
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i16 %a, 2
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i16 %a2, i16* %clobberdst, align 1
	; MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %bswap
	;			;
	%a = load i16, i16* %src, align 1			%a = load i16, i16* %src, align 1
	%bswap = call i16 @llvm.bswap.i16(i16 %a)			%bswap = call i16 @llvm.bswap.i16(i16 %a)

	%a2 = shl i16 %a, 2 ; incur an extra use to the load			%a2 = shl i16 %a, 2 ; incur an extra use to the load
	store i16 %a2, i16* %clobberdst, align 1			store i16 %a2, i16* %clobberdst, align 1

	ret i16 %bswap			ret i16 %bswap
	}			}

	define i32 @var_load_bswap_i32(i32* %src) {			define i32 @var_load_bswap_i32(i32* %src) {
	; ALL-LABEL: 'var_load_bswap_i32'			; X64-LABEL: 'var_load_bswap_i32'
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
	; ALL-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
	; ALL-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
				;
				; X64-MOVBE-LABEL: 'var_load_bswap_i32'
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i32'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i32'
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i32'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i32'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i32, i32* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i32 @llvm.bswap.i32(i32 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %bswap
	;			;
	%a = load i32, i32* %src, align 1			%a = load i32, i32* %src, align 1
	%bswap = call i32 @llvm.bswap.i32(i32 %a)			%bswap = call i32 @llvm.bswap.i32(i32 %a)

	ret i32 %bswap			ret i32 %bswap
	}			}
	define i32 @var_load_bswap_i32_extrause(i32* %src, i32* %clobberdst) {			define i32 @var_load_bswap_i32_extrause(i32* %src, i32* %clobberdst) {
	; ALL-LABEL: 'var_load_bswap_i32_extrause'			; ALL-LABEL: 'var_load_bswap_i32_extrause'
	Show All 13 Lines
	}			}

	define i64 @var_load_bswap_i64(i64* %src) {			define i64 @var_load_bswap_i64(i64* %src) {
	; X64-LABEL: 'var_load_bswap_i64'			; X64-LABEL: 'var_load_bswap_i64'
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	; X86-LABEL: 'var_load_bswap_i64'			; X64-MOVBE-LABEL: 'var_load_bswap_i64'
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i64'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i64'
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i64'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i64'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	RKSimon (inline comment, unsubmitted, not done): Script being stupid again - you'll need to fix your prefixes
	lebedev.ri (author; inline comment, unsubmitted, not done): UGH, I thought I did :( We need to disable FileCheck strict mode for x86 tests.
	%a = load i64, i64* %src, align 1			%a = load i64, i64* %src, align 1
	%bswap = call i64 @llvm.bswap.i64(i64 %a)			%bswap = call i64 @llvm.bswap.i64(i64 %a)

	ret i64 %bswap			ret i64 %bswap
	}			}
	define i64 @var_load_bswap_i64_extrause(i64* %src, i64* %clobberdst) {			define i64 @var_load_bswap_i64_extrause(i64* %src, i64* %clobberdst) {
	; X64-LABEL: 'var_load_bswap_i64_extrause'			; X64-LABEL: 'var_load_bswap_i64_extrause'
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i64 %a, 2			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i64 %a, 2
	; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %a2, i64* %clobberdst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %a2, i64* %clobberdst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	; X86-LABEL: 'var_load_bswap_i64_extrause'			; X64-MOVBE-LABEL: 'var_load_bswap_i64_extrause'
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i64 %a, 2			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i64 %a, 2
	; X86-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %a2, i64* %clobberdst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %a2, i64* %clobberdst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i64_extrause'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a = load i64, i64* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %a2 = shl i64 %a, 2
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 1 for instruction: store i64 %a2, i64* %clobberdst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i64_extrause'
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i64 %a, 2
				; X32-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %a2, i64* %clobberdst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i64_extrause'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i64 %a, 2
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %a2, i64* %clobberdst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i64_extrause'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i64, i64* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i64 @llvm.bswap.i64(i64 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i64 %a, 2
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i64 %a2, i64* %clobberdst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %bswap
	;			;
	%a = load i64, i64* %src, align 1			%a = load i64, i64* %src, align 1
	%bswap = call i64 @llvm.bswap.i64(i64 %a)			%bswap = call i64 @llvm.bswap.i64(i64 %a)

	%a2 = shl i64 %a, 2 ; incur an extra use to the load			%a2 = shl i64 %a, 2 ; incur an extra use to the load
	store i64 %a2, i64* %clobberdst, align 1			store i64 %a2, i64* %clobberdst, align 1

	ret i64 %bswap			ret i64 %bswap
	}			}

	define i128 @var_load_bswap_i128(i128* %src) {			define i128 @var_load_bswap_i128(i128* %src) {
	; X64-LABEL: 'var_load_bswap_i128'			; X64-LABEL: 'var_load_bswap_i128'
	craig.topper (inline comment, unsubmitted, not done): And here
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	; X86-LABEL: 'var_load_bswap_i128'			; X64-MOVBE-LABEL: 'var_load_bswap_i128'
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i128'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i128'
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i128'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i128'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	%a = load i128, i128* %src, align 1			%a = load i128, i128* %src, align 1
	%bswap = call i128 @llvm.bswap.i128(i128 %a)			%bswap = call i128 @llvm.bswap.i128(i128 %a)

	ret i128 %bswap			ret i128 %bswap
	}			}
	define i128 @var_load_bswap_i128_extrause(i128* %src, i128* %clobberdst) {			define i128 @var_load_bswap_i128_extrause(i128* %src, i128* %clobberdst) {
	; X64-LABEL: 'var_load_bswap_i128_extrause'			; X64-LABEL: 'var_load_bswap_i128_extrause'
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i128 %a, 2			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i128 %a, 2
	; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %a2, i128* %clobberdst, align 1			; X64-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %a2, i128* %clobberdst, align 1
	; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X64-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	; X86-LABEL: 'var_load_bswap_i128_extrause'			; X64-MOVBE-LABEL: 'var_load_bswap_i128_extrause'
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 8 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a2 = shl i128 %a, 2			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i128 %a, 2
	; X86-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %a2, i128* %clobberdst, align 1			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %a2, i128* %clobberdst, align 1
	; X86-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap			; X64-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X64-FASTMOVBE-LABEL: 'var_load_bswap_i128_extrause'
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a = load i128, i128* %src, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %a2 = shl i128 %a, 2
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 2 for instruction: store i128 %a2, i128* %clobberdst, align 1
				; X64-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-LABEL: 'var_load_bswap_i128_extrause'
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a2 = shl i128 %a, 2
				; X32-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %a2, i128* %clobberdst, align 1
				; X32-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-MOVBE-LABEL: 'var_load_bswap_i128_extrause'
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a2 = shl i128 %a, 2
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %a2, i128* %clobberdst, align 1
				; X32-MOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
				;
				; X32-FASTMOVBE-LABEL: 'var_load_bswap_i128_extrause'
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a = load i128, i128* %src, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %bswap = call i128 @llvm.bswap.i128(i128 %a)
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %a2 = shl i128 %a, 2
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 4 for instruction: store i128 %a2, i128* %clobberdst, align 1
				; X32-FASTMOVBE-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i128 %bswap
	;			;
	%a = load i128, i128* %src, align 1			%a = load i128, i128* %src, align 1
	%bswap = call i128 @llvm.bswap.i128(i128 %a)			%bswap = call i128 @llvm.bswap.i128(i128 %a)

	%a2 = shl i128 %a, 2 ; incur an extra use to the load			%a2 = shl i128 %a, 2 ; incur an extra use to the load
	store i128 %a2, i128* %clobberdst, align 1			store i128 %a2, i128* %clobberdst, align 1

	ret i128 %bswap			ret i128 %bswap
	}			}

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Improve costmodel for scalar byte swaps
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 343832

llvm/lib/Target/X86/X86.td

llvm/lib/Target/X86/X86Subtarget.h

llvm/lib/Target/X86/X86TargetTransformInfo.cpp

llvm/test/Analysis/CostModel/X86/bswap-store.ll

llvm/test/Analysis/CostModel/X86/bswap.ll

llvm/test/Analysis/CostModel/X86/load-bswap.ll

This is an archive of the discontinued LLVM Phabricator instance.

[X86] Improve costmodel for scalar byte swaps
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 343832

llvm/lib/Target/X86/X86.td

llvm/lib/Target/X86/X86Subtarget.h

llvm/lib/Target/X86/X86TargetTransformInfo.cpp

llvm/test/Analysis/CostModel/X86/bswap-store.ll

llvm/test/Analysis/CostModel/X86/bswap.ll

llvm/test/Analysis/CostModel/X86/load-bswap.ll

[X86] Improve costmodel for scalar byte swaps
ClosedPublic