Diff 515375

llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp

Show First 20 Lines • Show All 517 Lines • ▼ Show 20 Lines	if ((LT.second.getScalarType() == MVT::f32 \|\|
Cost += getIntrinsicInstrCost(Attrs1, CostKind);		Cost += getIntrinsicInstrCost(Attrs1, CostKind);
IntrinsicCostAttributes Attrs2(IsSigned ? Intrinsic::smax : Intrinsic::umax,		IntrinsicCostAttributes Attrs2(IsSigned ? Intrinsic::smax : Intrinsic::umax,
LegalTy, {LegalTy, LegalTy});		LegalTy, {LegalTy, LegalTy});
Cost += getIntrinsicInstrCost(Attrs2, CostKind);		Cost += getIntrinsicInstrCost(Attrs2, CostKind);
return LT.first * Cost;		return LT.first * Cost;
}		}
break;		break;
}		}
		case Intrinsic::fshl:
		case Intrinsic::fshr: {
		if (ICA.getArgs().empty())
		break;

		// TODO: Add handling for fshl where third argument is not a constant.
		dmgreenUnsubmitted Not Done Reply Inline Actions I would just combine fshr into a single patch I think. They seem to be essentially the same. dmgreen: I would just combine fshr into a single patch I think. They seem to be essentially the same.
		const TTI::OperandValueInfo OpInfoZ = TTI::getOperandInfo(ICA.getArgs()[2]);
		if (!OpInfoZ.isConstant())
		break;

		const auto LegalisationCost = getTypeLegalizationCost(RetTy);
		if (OpInfoZ.isUniform()) {
		// FIXME: The costs could be lower if the codegen is better.
		static const CostTblEntry FshlTbl[] = {
		dmgreenUnsubmitted Not Done Reply Inline Actions Can you add i16 and i8 vector types too? And 64bit vector sizes like v2i32. Can you add a FIXME that the cost could be lower if the codegen was better. dmgreen: Can you add i16 and i8 vector types too? And 64bit vector sizes like v2i32. Can you add a FIXME…
		{Intrinsic::fshl, MVT::v4i32, 3}, // ushr + shl + orr
		{Intrinsic::fshl, MVT::v2i64, 3}, {Intrinsic::fshl, MVT::v16i8, 4},
		{Intrinsic::fshl, MVT::v8i16, 4}, {Intrinsic::fshl, MVT::v2i32, 3},
		{Intrinsic::fshl, MVT::v8i8, 4}, {Intrinsic::fshl, MVT::v4i16, 4}};
		// Costs for both fshl & fshr are the same, so just pass Intrinsic::fshl
		// to avoid having to duplicate the costs.
		const auto *Entry =
		CostTableLookup(FshlTbl, Intrinsic::fshl, LegalisationCost.second);
		if (Entry)
		return LegalisationCost.first * Entry->Cost;
		dmgreenUnsubmitted Not Done Reply Inline Actions Why does this not use RetTy, as above? dmgreen: Why does this not use RetTy, as above?
		dmgreenUnsubmitted Not Done Reply Inline Actions You could just pass Intrinsic::fshl if the costs are expected to be the same, so long as there is a comment explaining it. It would help reduce the size of the table. dmgreen: You could just pass Intrinsic::fshl if the costs are expected to be the same, so long as there…
		fhahnUnsubmitted Not Done Reply Inline Actions done in the committed version. fhahn: done in the committed version.
		}

		dmgreenUnsubmitted Not Done Reply Inline Actions What is this guarding against? Other vector types? dmgreen: What is this guarding against? Other vector types?
		auto TyL = getTypeLegalizationCost(RetTy);
		dmgreenUnsubmitted Not Done Reply Inline Actions Is this correct, that it's breaking if it is an integer type? dmgreen: Is this correct, that it's breaking if it is an integer type?
		if (!RetTy->isIntegerTy())
		break;

		// Estimate cost manually, as types like i8 and i16 will get promoted to
		// i32 and CostTableLookup will ignore the extra conversion cost.
		bool HigherCost = (RetTy->getScalarSizeInBits() != 32 &&
		RetTy->getScalarSizeInBits() < 64) \|\|
		dmgreenUnsubmitted Not Done Reply Inline Actions `!= 64` is covered by `< 64` dmgreen: `!= 64` is covered by `< 64`
		(RetTy->getScalarSizeInBits() % 64 != 0);
		unsigned ExtraCost = HigherCost ? 1 : 0;
		dmgreenUnsubmitted Not Done Reply Inline Actions I don't think it's "equal to i8 or i16", it should be "not equal to i32 or i64", and any smaller sizes should get a larger cost. Or any larger sizes not a multiple of 64. dmgreen: I don't think it's "equal to i8 or i16", it should be "not equal to i32 or i64", and any…
		if (RetTy->getScalarSizeInBits() == 32 \|\|
		RetTy->getScalarSizeInBits() == 64)
		ExtraCost = 0; // fshl/fshr for i32 and i64 can be lowered to a single
		// extr instruction.
		else if (HigherCost)
		ExtraCost = 1;
		else
		dmgreenUnsubmitted Not Done Reply Inline Actions There is a debug message left here, which is coming out in the tests too. dmgreen: There is a debug message left here, which is coming out in the tests too.
		break;
		dmgreenUnsubmitted Not Done Reply Inline Actions I think this can just be `unsigned Cost = HigherCost ? 1 : 0`. The comment would be good to keep though. Maybe call it "ExtraCost" too, to show it's an addition not the base cost. dmgreen: I think this can just be `unsigned Cost = HigherCost ? 1 : 0`. The comment would be good to…
		fhahnUnsubmitted Not Done Reply Inline Actions I tried that but it was causing some changes so I kept the original version for now. I updated the name. fhahn: I tried that but it was causing some changes so I kept the original version for now. I updated…
		return TyL.first + ExtraCost;
		}
default:		default:
		dmgreenUnsubmitted Not Done Reply Inline Actions Do you have any opinions of whether this should be `TyL.first * Cost` (with a Cost of 1/2) or `TyL.first + Cost` (with a cost of 0/1)? It might capture the "extra shift" a little better, for integer types at least. As far as I can see NumElements is always 1 here? dmgreen: Do you have any opinions of whether this should be `TyL.first * Cost` (with a Cost of 1/2) or…
		zjaffalAuthorUnsubmitted Done Reply Inline Actions As far as I can see NumElements is always 1 here? I was trying to see if the same code works for vector instructions but I think it might be easier to do that in a different patch given the following code is an overestimate for the true cost. Do you have any opinions of whether this should be TyL.first * Cost (with a Cost of 1/2) or TyL.first + Cost (with a cost of 0/1)? It might capture the "extra shift" a little better, for integer types at least. I will test it now and see if there are any differences. zjaffal: >As far as I can see NumElements is always 1 here? I was trying to see if the same code works…
break;		break;
}		}
return BaseT::getIntrinsicInstrCost(ICA, CostKind);		return BaseT::getIntrinsicInstrCost(ICA, CostKind);
}		}

/// The function will remove redundant reinterprets casting in the presence		/// The function will remove redundant reinterprets casting in the presence
/// of the control flow		/// of the control flow
static std::optional<Instruction *> processPhiNode(InstCombiner &IC,		static std::optional<Instruction *> processPhiNode(InstCombiner &IC,
▲ Show 20 Lines • Show All 2,967 Lines • Show Last 20 Lines

llvm/test/Analysis/CostModel/AArch64/fshl.ll

; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 2		; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 2
; RUN: opt -passes="print<cost-model>" -disable-output -mtriple=arm64-apple-ios < %s 2>&1 \| FileCheck %s		; RUN: opt -passes="print<cost-model>" -disable-output -mtriple=arm64-apple-ios < %s 2>&1 \| FileCheck %s

target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"		target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
		dmgreenUnsubmitted Not Done Reply Inline Actions If there isn't already one, then adding a llvm.fshr version of this test file would be good too. dmgreen: If there isn't already one, then adding a llvm.fshr version of this test file would be good too.
		fhahnUnsubmitted Not Done Reply Inline Actions yep, there's `fshr.ll` which is a copy of `fshl.ll` with fshl replaced by fshr. fhahn: yep, there's `fshr.ll` which is a copy of `fshl.ll` with fshl replaced by fshr.

define i8 @fshl_i8_3rd_arg_const(i8 %a, i8 %b) {		define i8 @fshl_i8_3rd_arg_const(i8 %a, i8 %b) {
; CHECK-LABEL: 'fshl_i8_3rd_arg_const'		; CHECK-LABEL: 'fshl_i8_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshl
;		;
entry:		entry:
%fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 9)		%fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 9)
ret i8 %fshl		ret i8 %fshl
}		}

define i8 @fshl_i8_3rd_arg_var(i8 %a, i8 %b, i8 %c) {		define i8 @fshl_i8_3rd_arg_var(i8 %a, i8 %b, i8 %c) {
; CHECK-LABEL: 'fshl_i8_3rd_arg_var'		; CHECK-LABEL: 'fshl_i8_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshl
;		;
entry:		entry:
%fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 %c)		%fshl = tail call i8 @llvm.fshl.i8(i8 %a, i8 %b, i8 %c)
ret i8 %fshl		ret i8 %fshl
}		}

declare i8 @llvm.fshl.i8(i8, i8, i8)		declare i8 @llvm.fshl.i8(i8, i8, i8)

define i16 @fshl_i16(i16 %a, i16 %b) {		define i16 @fshl_i16(i16 %a, i16 %b) {
; CHECK-LABEL: 'fshl_i16'		; CHECK-LABEL: 'fshl_i16'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call i16 @llvm.fshl.i16(i16 %a, i16 %b, i16 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshl = tail call i16 @llvm.fshl.i16(i16 %a, i16 %b, i16 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %fshl
;		;
entry:		entry:
%fshl = tail call i16 @llvm.fshl.i16(i16 %a, i16 %b, i16 9)		%fshl = tail call i16 @llvm.fshl.i16(i16 %a, i16 %b, i16 9)
ret i16 %fshl		ret i16 %fshl
}		}

declare i16 @llvm.fshl.i16(i16, i16, i16)		declare i16 @llvm.fshl.i16(i16, i16, i16)

define i32 @fshl_i32_3rd_arg_const(i32 %a, i32 %b) {		define i32 @fshl_i32_3rd_arg_const(i32 %a, i32 %b) {
; CHECK-LABEL: 'fshl_i32_3rd_arg_const'		; CHECK-LABEL: 'fshl_i32_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshl
;		;
entry:		entry:
%fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 9)		%fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 9)
ret i32 %fshl		ret i32 %fshl
}		}

define i32 @fshl_i32_3rd_arg_var(i32 %a, i32 %b, i32 %c) {		define i32 @fshl_i32_3rd_arg_var(i32 %a, i32 %b, i32 %c) {
; CHECK-LABEL: 'fshl_i32_3rd_arg_var'		; CHECK-LABEL: 'fshl_i32_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshl
;		;
entry:		entry:
%fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 %c)		%fshl = tail call i32 @llvm.fshl.i32(i32 %a, i32 %b, i32 %c)
ret i32 %fshl		ret i32 %fshl
}		}

declare i32 @llvm.fshl.i32(i32, i32, i32)		declare i32 @llvm.fshl.i32(i32, i32, i32)

define i64 @fshl_i64_3rd_arg_const(i64 %a, i64 %b) {		define i64 @fshl_i64_3rd_arg_const(i64 %a, i64 %b) {
; CHECK-LABEL: 'fshl_i64_3rd_arg_const'		; CHECK-LABEL: 'fshl_i64_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshl
;		;
entry:		entry:
%fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 9)		%fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 9)
ret i64 %fshl		ret i64 %fshl
}		}

define i64 @fshl_i64_3rd_arg_var(i64 %a, i64 %b, i64 %c) {		define i64 @fshl_i64_3rd_arg_var(i64 %a, i64 %b, i64 %c) {
; CHECK-LABEL: 'fshl_i64_3rd_arg_var'		; CHECK-LABEL: 'fshl_i64_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshl
;		;
entry:		entry:
%fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 %c)		%fshl = tail call i64 @llvm.fshl.i64(i64 %a, i64 %b, i64 %c)
ret i64 %fshl		ret i64 %fshl
}		}

declare i64 @llvm.fshl.i64(i64, i64, i64)		declare i64 @llvm.fshl.i64(i64, i64, i64)

define i19 @fshl_i19(i19 %a, i19 %b) {		define i19 @fshl_i19(i19 %a, i19 %b) {
; CHECK-LABEL: 'fshl_i19'		; CHECK-LABEL: 'fshl_i19'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call i19 @llvm.fshl.i19(i19 %a, i19 %b, i19 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshl = tail call i19 @llvm.fshl.i19(i19 %a, i19 %b, i19 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i19 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i19 %fshl
;		;
entry:		entry:
%fshl = tail call i19 @llvm.fshl.i19(i19 %a, i19 %b, i19 9)		%fshl = tail call i19 @llvm.fshl.i19(i19 %a, i19 %b, i19 9)
ret i19 %fshl		ret i19 %fshl
}		}

declare i19 @llvm.fshl.i19(i19, i19, i19)		declare i19 @llvm.fshl.i19(i19, i19, i19)


define <16 x i8> @fshl_v16i8_3rd_arg_vec_const_all_lanes_same(<16 x i8> %a, <16 x i8> %b) {		define <16 x i8> @fshl_v16i8_3rd_arg_vec_const_all_lanes_same(<16 x i8> %a, <16 x i8> %b) {
; CHECK-LABEL: 'fshl_v16i8_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshl_v16i8_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <16 x i8> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <16 x i8> %fshl
;		;
entry:		entry:
%fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)		%fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)
ret <16 x i8> %fshl		ret <16 x i8> %fshl
}		}

define <16 x i8> @fshl_v16i8_3rd_arg_vec_const_lanes_different(<16 x i8> %a, <16 x i8> %b) {		define <16 x i8> @fshl_v16i8_3rd_arg_vec_const_lanes_different(<16 x i8> %a, <16 x i8> %b) {
Show All 15 Lines	entry:
%fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c)		%fshl = tail call <16 x i8> @llvm.fshl.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c)
ret <16 x i8> %fshl		ret <16 x i8> %fshl
}		}

declare <16 x i8> @llvm.fshl.v16i8(<16 x i8>, <16 x i8>, <16 x i8>)		declare <16 x i8> @llvm.fshl.v16i8(<16 x i8>, <16 x i8>, <16 x i8>)

define <8 x i16> @fshl_v8i16_3rd_arg_vec_const_all_lanes_same(<8 x i16> %a, <8 x i16> %b) {		define <8 x i16> @fshl_v8i16_3rd_arg_vec_const_all_lanes_same(<8 x i16> %a, <8 x i16> %b) {
; CHECK-LABEL: 'fshl_v8i16_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshl_v8i16_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <8 x i16> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <8 x i16> %fshl
;		;
entry:		entry:
%fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)		%fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)
ret <8 x i16> %fshl		ret <8 x i16> %fshl
}		}

define <8 x i16> @fshl_v8i16_3rd_arg_vec_const_lanes_different(<8 x i16> %a, <8 x i16> %b) {		define <8 x i16> @fshl_v8i16_3rd_arg_vec_const_lanes_different(<8 x i16> %a, <8 x i16> %b) {
Show All 15 Lines	entry:
%fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c)		%fshl = tail call <8 x i16> @llvm.fshl.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c)
ret <8 x i16> %fshl		ret <8 x i16> %fshl
}		}

declare <8 x i16> @llvm.fshl.v8i16(<8 x i16>, <8 x i16>, <8 x i16>)		declare <8 x i16> @llvm.fshl.v8i16(<8 x i16>, <8 x i16>, <8 x i16>)

define <4 x i32> @fshl_v4i32_3rd_arg_vec_const_all_lanes_same(<4 x i32> %a, <4 x i32> %b) {		define <4 x i32> @fshl_v4i32_3rd_arg_vec_const_all_lanes_same(<4 x i32> %a, <4 x i32> %b) {
; CHECK-LABEL: 'fshl_v4i32_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshl_v4i32_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i32> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i32> %fshl
;		;
entry:		entry:
%fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)		%fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)
ret <4 x i32> %fshl		ret <4 x i32> %fshl
}		}

define <4 x i32> @fshl_v4i32_3rd_arg_vec_const_lanes_different(<4 x i32> %a, <4 x i32> %b) {		define <4 x i32> @fshl_v4i32_3rd_arg_vec_const_lanes_different(<4 x i32> %a, <4 x i32> %b) {
Show All 15 Lines	entry:
%fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c)		%fshl = tail call <4 x i32> @llvm.fshl.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c)
ret <4 x i32> %fshl		ret <4 x i32> %fshl
}		}

declare <4 x i32> @llvm.fshl.v4i32(<4 x i32>, <4 x i32>, <4 x i32>)		declare <4 x i32> @llvm.fshl.v4i32(<4 x i32>, <4 x i32>, <4 x i32>)

define <2 x i64> @fshl_v2i64_3rd_arg_vec_const_all_lanes_same(<2 x i64> %a, <2 x i64> %b) {		define <2 x i64> @fshl_v2i64_3rd_arg_vec_const_all_lanes_same(<2 x i64> %a, <2 x i64> %b) {
; CHECK-LABEL: 'fshl_v2i64_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshl_v2i64_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <2 x i64> @llvm.fshl.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshl = tail call <2 x i64> @llvm.fshl.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshl
;		;
entry:		entry:
%fshl = tail call <2 x i64> @llvm.fshl.v4i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)		%fshl = tail call <2 x i64> @llvm.fshl.v4i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)
		dmgreenUnsubmitted Not Done Reply Inline Actions v2i64 dmgreen: v2i64
ret <2 x i64> %fshl		ret <2 x i64> %fshl
}		}

define <2 x i64> @fshl_v2i64_3rd_arg_vec_const_lanes_different(<2 x i64> %a, <2 x i64> %b) {		define <2 x i64> @fshl_v2i64_3rd_arg_vec_const_lanes_different(<2 x i64> %a, <2 x i64> %b) {
; CHECK-LABEL: 'fshl_v2i64_3rd_arg_vec_const_lanes_different'		; CHECK-LABEL: 'fshl_v2i64_3rd_arg_vec_const_lanes_different'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <2 x i64> @llvm.fshl.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 2>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshl = tail call <2 x i64> @llvm.fshl.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 2>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshl
;		;
Show All 16 Lines

define <4 x i30> @fshl_v4i30_3rd_arg_var(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c) {		define <4 x i30> @fshl_v4i30_3rd_arg_var(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c) {
; CHECK-LABEL: 'fshl_v4i30_3rd_arg_var'		; CHECK-LABEL: 'fshl_v4i30_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %fshl = tail call <4 x i30> @llvm.fshl.v4i30(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 36 for instruction: %fshl = tail call <4 x i30> @llvm.fshl.v4i30(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i30> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i30> %fshl
;		;
entry:		entry:
%fshl = tail call <4 x i30> @llvm.fshl.v4i30(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c)		%fshl = tail call <4 x i30> @llvm.fshl.v4i30(<4 x i30> %a, <4 x i30> %b, <4 x i30> %c)
ret <4 x i30> %fshl		ret <4 x i30> %fshl
		dmgreenUnsubmitted Not Done Reply Inline Actions Should this be with equal operands and i66? Otherwise it would not get past the isUniform check. Or is it intended to check the other code? We are probably getting into pretty uncommon cases here either way :) dmgreen: Should this be with equal operands and i66? Otherwise it would not get past the isUniform check.
}		}

declare <4 x i30> @llvm.fshl.v4i30(<4 x i30>, <4 x i30>, <4 x i30>)		declare <4 x i30> @llvm.fshl.v4i30(<4 x i30>, <4 x i30>, <4 x i30>)

		dmgreenUnsubmitted Not Done Reply Inline Actions Maybe add a test for i128 too? It might be relatively common from crypto functions and would help test one of the codepaths. dmgreen: Maybe add a test for i128 too? It might be relatively common from crypto functions and would…
		fhahnUnsubmitted Not Done Reply Inline Actions I added i128 tests in 8d4f92601c3c1fcc6ecc10352e2234b5c064e954 fhahn: I added i128 tests in 8d4f92601c3c1fcc6ecc10352e2234b5c064e954
define <2 x i66> @fshl_v2i66_3rd_arg_vec_const_lanes_different(<2 x i66> %a, <2 x i66> %b) {		define <2 x i66> @fshl_v2i66_3rd_arg_vec_const_lanes_different(<2 x i66> %a, <2 x i66> %b) {
; CHECK-LABEL: 'fshl_v2i66_3rd_arg_vec_const_lanes_different'		; CHECK-LABEL: 'fshl_v2i66_3rd_arg_vec_const_lanes_different'
; CHECK-NEXT: Cost Model: Found an estimated cost of 24 for instruction: %fshl = tail call <2 x i66> @llvm.fshl.v2i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 24 for instruction: %fshl = tail call <2 x i66> @llvm.fshl.v2i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i66> %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i66> %fshl
;		;
entry:		entry:
%fshl = tail call <2 x i66> @llvm.fshl.v4i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)		%fshl = tail call <2 x i66> @llvm.fshl.v4i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)
ret <2 x i66> %fshl		ret <2 x i66> %fshl
}		}
declare <2 x i66> @llvm.fshl.v4i66(<2 x i66>, <2 x i66>, <2 x i66>)		declare <2 x i66> @llvm.fshl.v4i66(<2 x i66>, <2 x i66>, <2 x i66>)

define i66 @fshl_i66(i66 %a, i66 %b) {		define i66 @fshl_i66(i66 %a, i66 %b) {
; CHECK-LABEL: 'fshl_i66'		; CHECK-LABEL: 'fshl_i66'
; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %fshl = tail call i66 @llvm.fshl.i66(i66 %a, i66 %b, i66 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshl = tail call i66 @llvm.fshl.i66(i66 %a, i66 %b, i66 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i66 %fshl		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i66 %fshl
;		;
entry:		entry:
%fshl = tail call i66 @llvm.fshl.i66(i66 %a, i66 %b, i66 9)		%fshl = tail call i66 @llvm.fshl.i66(i66 %a, i66 %b, i66 9)
ret i66 %fshl		ret i66 %fshl
}		}

declare i66 @llvm.fshl.i66(i66, i66, i66)		declare i66 @llvm.fshl.i66(i66, i66, i66)
Show All 23 Lines

llvm/test/Analysis/CostModel/AArch64/fshr.ll

; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 2		; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py UTC_ARGS: --version 2
; RUN: opt -passes="print<cost-model>" -disable-output -mtriple=arm64-apple-ios < %s 2>&1 \| FileCheck %s		; RUN: opt -passes="print<cost-model>" -disable-output -mtriple=arm64-apple-ios < %s 2>&1 \| FileCheck %s

target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"		target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"

define i8 @fshr_i8_3rd_arg_const(i8 %a, i8 %b) {		define i8 @fshr_i8_3rd_arg_const(i8 %a, i8 %b) {
; CHECK-LABEL: 'fshr_i8_3rd_arg_const'		; CHECK-LABEL: 'fshr_i8_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshr
;		;
entry:		entry:
%fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 9)		%fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 9)
ret i8 %fshr		ret i8 %fshr
}		}

define i8 @fshr_i8_3rd_arg_var(i8 %a, i8 %b, i8 %c) {		define i8 @fshr_i8_3rd_arg_var(i8 %a, i8 %b, i8 %c) {
; CHECK-LABEL: 'fshr_i8_3rd_arg_var'		; CHECK-LABEL: 'fshr_i8_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i8 %fshr
;		;
entry:		entry:
%fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 %c)		%fshr = tail call i8 @llvm.fshr.i8(i8 %a, i8 %b, i8 %c)
ret i8 %fshr		ret i8 %fshr
}		}

declare i8 @llvm.fshr.i8(i8, i8, i8)		declare i8 @llvm.fshr.i8(i8, i8, i8)

define i16 @fshr_i16(i16 %a, i16 %b) {		define i16 @fshr_i16(i16 %a, i16 %b) {
; CHECK-LABEL: 'fshr_i16'		; CHECK-LABEL: 'fshr_i16'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call i16 @llvm.fshr.i16(i16 %a, i16 %b, i16 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshr = tail call i16 @llvm.fshr.i16(i16 %a, i16 %b, i16 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i16 %fshr
;		;
entry:		entry:
%fshr = tail call i16 @llvm.fshr.i16(i16 %a, i16 %b, i16 9)		%fshr = tail call i16 @llvm.fshr.i16(i16 %a, i16 %b, i16 9)
ret i16 %fshr		ret i16 %fshr
}		}

declare i16 @llvm.fshr.i16(i16, i16, i16)		declare i16 @llvm.fshr.i16(i16, i16, i16)

define i32 @fshr_i32_3rd_arg_const(i32 %a, i32 %b) {		define i32 @fshr_i32_3rd_arg_const(i32 %a, i32 %b) {
; CHECK-LABEL: 'fshr_i32_3rd_arg_const'		; CHECK-LABEL: 'fshr_i32_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshr
;		;
entry:		entry:
%fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 9)		%fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 9)
ret i32 %fshr		ret i32 %fshr
}		}

define i32 @fshr_i32_3rd_arg_var(i32 %a, i32 %b, i32 %c) {		define i32 @fshr_i32_3rd_arg_var(i32 %a, i32 %b, i32 %c) {
; CHECK-LABEL: 'fshr_i32_3rd_arg_var'		; CHECK-LABEL: 'fshr_i32_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 9 for instruction: %fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i32 %fshr
;		;
entry:		entry:
%fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 %c)		%fshr = tail call i32 @llvm.fshr.i32(i32 %a, i32 %b, i32 %c)
ret i32 %fshr		ret i32 %fshr
}		}

declare i32 @llvm.fshr.i32(i32, i32, i32)		declare i32 @llvm.fshr.i32(i32, i32, i32)

define i64 @fshr_i64_3rd_arg_const(i64 %a, i64 %b) {		define i64 @fshr_i64_3rd_arg_const(i64 %a, i64 %b) {
; CHECK-LABEL: 'fshr_i64_3rd_arg_const'		; CHECK-LABEL: 'fshr_i64_3rd_arg_const'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 1 for instruction: %fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshr
;		;
entry:		entry:
%fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 9)		%fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 9)
ret i64 %fshr		ret i64 %fshr
}		}

define i64 @fshr_i64_3rd_arg_var(i64 %a, i64 %b, i64 %c) {		define i64 @fshr_i64_3rd_arg_var(i64 %a, i64 %b, i64 %c) {
; CHECK-LABEL: 'fshr_i64_3rd_arg_var'		; CHECK-LABEL: 'fshr_i64_3rd_arg_var'
; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 %c)		; CHECK-NEXT: Cost Model: Found an estimated cost of 15 for instruction: %fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 %c)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i64 %fshr
;		;
entry:		entry:
%fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 %c)		%fshr = tail call i64 @llvm.fshr.i64(i64 %a, i64 %b, i64 %c)
ret i64 %fshr		ret i64 %fshr
}		}

declare i64 @llvm.fshr.i64(i64, i64, i64)		declare i64 @llvm.fshr.i64(i64, i64, i64)

define i19 @fshr_i19(i19 %a, i19 %b) {		define i19 @fshr_i19(i19 %a, i19 %b) {
; CHECK-LABEL: 'fshr_i19'		; CHECK-LABEL: 'fshr_i19'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call i19 @llvm.fshr.i19(i19 %a, i19 %b, i19 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 2 for instruction: %fshr = tail call i19 @llvm.fshr.i19(i19 %a, i19 %b, i19 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i19 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i19 %fshr
;		;
entry:		entry:
%fshr = tail call i19 @llvm.fshr.i19(i19 %a, i19 %b, i19 9)		%fshr = tail call i19 @llvm.fshr.i19(i19 %a, i19 %b, i19 9)
ret i19 %fshr		ret i19 %fshr
}		}

declare i19 @llvm.fshr.i19(i19, i19, i19)		declare i19 @llvm.fshr.i19(i19, i19, i19)


define <16 x i8> @fshr_v16i8_3rd_arg_vec_const_all_lanes_same(<16 x i8> %a, <16 x i8> %b) {		define <16 x i8> @fshr_v16i8_3rd_arg_vec_const_all_lanes_same(<16 x i8> %a, <16 x i8> %b) {
; CHECK-LABEL: 'fshr_v16i8_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshr_v16i8_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <16 x i8> %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <16 x i8> %fshr
;		;
entry:		entry:
%fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)		%fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> <i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3, i8 3>)
ret <16 x i8> %fshr		ret <16 x i8> %fshr
}		}

define <16 x i8> @fshr_v16i8_3rd_arg_vec_const_lanes_different(<16 x i8> %a, <16 x i8> %b) {		define <16 x i8> @fshr_v16i8_3rd_arg_vec_const_lanes_different(<16 x i8> %a, <16 x i8> %b) {
Show All 15 Lines	entry:
%fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c)		%fshr = tail call <16 x i8> @llvm.fshr.v16i8(<16 x i8> %a, <16 x i8> %b, <16 x i8> %c)
ret <16 x i8> %fshr		ret <16 x i8> %fshr
}		}

declare <16 x i8> @llvm.fshr.v16i8(<16 x i8>, <16 x i8>, <16 x i8>)		declare <16 x i8> @llvm.fshr.v16i8(<16 x i8>, <16 x i8>, <16 x i8>)

define <8 x i16> @fshr_v8i16_3rd_arg_vec_const_all_lanes_same(<8 x i16> %a, <8 x i16> %b) {		define <8 x i16> @fshr_v8i16_3rd_arg_vec_const_all_lanes_same(<8 x i16> %a, <8 x i16> %b) {
; CHECK-LABEL: 'fshr_v8i16_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshr_v8i16_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 4 for instruction: %fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <8 x i16> %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <8 x i16> %fshr
;		;
entry:		entry:
%fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)		%fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> <i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3, i16 3>)
ret <8 x i16> %fshr		ret <8 x i16> %fshr
}		}

define <8 x i16> @fshr_v8i16_3rd_arg_vec_const_lanes_different(<8 x i16> %a, <8 x i16> %b) {		define <8 x i16> @fshr_v8i16_3rd_arg_vec_const_lanes_different(<8 x i16> %a, <8 x i16> %b) {
Show All 15 Lines	entry:
%fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c)		%fshr = tail call <8 x i16> @llvm.fshr.v8i16(<8 x i16> %a, <8 x i16> %b, <8 x i16> %c)
ret <8 x i16> %fshr		ret <8 x i16> %fshr
}		}

declare <8 x i16> @llvm.fshr.v8i16(<8 x i16>, <8 x i16>, <8 x i16>)		declare <8 x i16> @llvm.fshr.v8i16(<8 x i16>, <8 x i16>, <8 x i16>)

define <4 x i32> @fshr_v4i32_3rd_arg_vec_const_all_lanes_same(<4 x i32> %a, <4 x i32> %b) {		define <4 x i32> @fshr_v4i32_3rd_arg_vec_const_all_lanes_same(<4 x i32> %a, <4 x i32> %b) {
; CHECK-LABEL: 'fshr_v4i32_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshr_v4i32_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i32> %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <4 x i32> %fshr
;		;
entry:		entry:
%fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)		%fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> <i32 3, i32 3, i32 3, i32 3>)
ret <4 x i32> %fshr		ret <4 x i32> %fshr
}		}

define <4 x i32> @fshr_v4i32_3rd_arg_vec_const_lanes_different(<4 x i32> %a, <4 x i32> %b) {		define <4 x i32> @fshr_v4i32_3rd_arg_vec_const_lanes_different(<4 x i32> %a, <4 x i32> %b) {
Show All 15 Lines	entry:
%fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c)		%fshr = tail call <4 x i32> @llvm.fshr.v4i32(<4 x i32> %a, <4 x i32> %b, <4 x i32> %c)
ret <4 x i32> %fshr		ret <4 x i32> %fshr
}		}

declare <4 x i32> @llvm.fshr.v4i32(<4 x i32>, <4 x i32>, <4 x i32>)		declare <4 x i32> @llvm.fshr.v4i32(<4 x i32>, <4 x i32>, <4 x i32>)

define <2 x i64> @fshr_v2i64_3rd_arg_vec_const_all_lanes_same(<2 x i64> %a, <2 x i64> %b) {		define <2 x i64> @fshr_v2i64_3rd_arg_vec_const_all_lanes_same(<2 x i64> %a, <2 x i64> %b) {
; CHECK-LABEL: 'fshr_v2i64_3rd_arg_vec_const_all_lanes_same'		; CHECK-LABEL: 'fshr_v2i64_3rd_arg_vec_const_all_lanes_same'
; CHECK-NEXT: Cost Model: Found an estimated cost of 6 for instruction: %fshr = tail call <2 x i64> @llvm.fshr.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshr = tail call <2 x i64> @llvm.fshr.v2i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret <2 x i64> %fshr
;		;
entry:		entry:
%fshr = tail call <2 x i64> @llvm.fshr.v4i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)		%fshr = tail call <2 x i64> @llvm.fshr.v4i64(<2 x i64> %a, <2 x i64> %b, <2 x i64> <i64 1, i64 1>)
ret <2 x i64> %fshr		ret <2 x i64> %fshr
}		}

define <2 x i64> @fshr_v2i64_3rd_arg_vec_const_lanes_different(<2 x i64> %a, <2 x i64> %b) {		define <2 x i64> @fshr_v2i64_3rd_arg_vec_const_lanes_different(<2 x i64> %a, <2 x i64> %b) {
Show All 38 Lines
entry:		entry:
%fshr = tail call <2 x i66> @llvm.fshr.v4i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)		%fshr = tail call <2 x i66> @llvm.fshr.v4i66(<2 x i66> %a, <2 x i66> %b, <2 x i66> <i66 1, i66 2>)
ret <2 x i66> %fshr		ret <2 x i66> %fshr
}		}
declare <2 x i66> @llvm.fshr.v4i66(<2 x i66>, <2 x i66>, <2 x i66>)		declare <2 x i66> @llvm.fshr.v4i66(<2 x i66>, <2 x i66>, <2 x i66>)

define i66 @fshr_i66(i66 %a, i66 %b) {		define i66 @fshr_i66(i66 %a, i66 %b) {
; CHECK-LABEL: 'fshr_i66'		; CHECK-LABEL: 'fshr_i66'
; CHECK-NEXT: Cost Model: Found an estimated cost of 12 for instruction: %fshr = tail call i66 @llvm.fshr.i66(i66 %a, i66 %b, i66 9)		; CHECK-NEXT: Cost Model: Found an estimated cost of 3 for instruction: %fshr = tail call i66 @llvm.fshr.i66(i66 %a, i66 %b, i66 9)
; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i66 %fshr		; CHECK-NEXT: Cost Model: Found an estimated cost of 0 for instruction: ret i66 %fshr
;		;
entry:		entry:
%fshr = tail call i66 @llvm.fshr.i66(i66 %a, i66 %b, i66 9)		%fshr = tail call i66 @llvm.fshr.i66(i66 %a, i66 %b, i66 9)
ret i66 %fshr		ret i66 %fshr
}		}

declare i66 @llvm.fshr.i66(i66, i66, i66)		declare i66 @llvm.fshr.i66(i66, i66, i66)
Show All 23 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64] Improve fshl cost modeling if 3rd arg is constant.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 515375

llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp

llvm/test/Analysis/CostModel/AArch64/fshl.ll

llvm/test/Analysis/CostModel/AArch64/fshr.ll

This is an archive of the discontinued LLVM Phabricator instance.

[AArch64] Improve fshl cost modeling if 3rd arg is constant.
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 515375

llvm/lib/Target/AArch64/AArch64TargetTransformInfo.cpp

llvm/test/Analysis/CostModel/AArch64/fshl.ll

llvm/test/Analysis/CostModel/AArch64/fshr.ll

[AArch64] Improve fshl cost modeling if 3rd arg is constant.
ClosedPublic