Diff 110960

lib/Analysis/ValueTracking.cpp

Show First 20 Lines • Show All 2,190 Lines • ▼ Show 20 Lines	if (const auto *CLHS = dyn_cast<Constant>(U->getOperand(0)))
}		}

// Sub can have at most one carry bit. Thus we know that the output		// Sub can have at most one carry bit. Thus we know that the output
// is, at worst, one more bit than the inputs.		// is, at worst, one more bit than the inputs.
Tmp = ComputeNumSignBits(U->getOperand(0), Depth + 1, Q);		Tmp = ComputeNumSignBits(U->getOperand(0), Depth + 1, Q);
if (Tmp == 1) return 1; // Early out.		if (Tmp == 1) return 1; // Early out.
return std::min(Tmp, Tmp2)-1;		return std::min(Tmp, Tmp2)-1;

		case Instruction::Mul: {
		// The output of the Mul can be at most twice the valid bits in the inputs.
		spatelUnsubmitted Done Reply Inline Actions can at -> can be at spatel: can at -> can be at
		Tmp = ComputeNumSignBits(U->getOperand(0), Depth + 1, Q);
		if (Tmp == 1) return 1; // Early out.
		Tmp2 = ComputeNumSignBits(U->getOperand(1), Depth + 1, Q);
		spatelUnsubmitted Done Reply Inline Actions It's poor to have variables named 'Tmp'. These can be locals now, so let's give these meaningful names - SignBitsOp0/SignBitsOp1 or something like that. spatel: It's poor to have variables named 'Tmp'. These can be locals now, so let's give these…
		if (Tmp2 == 1) return 1;
		unsigned OutValidBits = (TyBits - Tmp + 1) + (TyBits - Tmp2 + 1);
		return OutValidBits > TyBits ? 1 : TyBits - OutValidBits + 1;
		}

case Instruction::PHI: {		case Instruction::PHI: {
const PHINode *PN = cast<PHINode>(U);		const PHINode *PN = cast<PHINode>(U);
unsigned NumIncomingValues = PN->getNumIncomingValues();		unsigned NumIncomingValues = PN->getNumIncomingValues();
// Don't analyze large in-degree PHIs.		// Don't analyze large in-degree PHIs.
if (NumIncomingValues > 4) break;		if (NumIncomingValues > 4) break;
// Unreachable blocks may have zero-operand PHI nodes.		// Unreachable blocks may have zero-operand PHI nodes.
if (NumIncomingValues == 0) break;		if (NumIncomingValues == 0) break;

▲ Show 20 Lines • Show All 2,388 Lines • Show Last 20 Lines

lib/Transforms/InstCombine/InstCombineCasts.cpp

Show First 20 Lines • Show All 363 Lines • ▼ Show 20 Lines	if (ConstantInt *CI = dyn_cast<ConstantInt>(I->getOperand(1))) {
uint32_t BitWidth = Ty->getScalarSizeInBits();		uint32_t BitWidth = Ty->getScalarSizeInBits();
if (IC.MaskedValueIsZero(I->getOperand(0),		if (IC.MaskedValueIsZero(I->getOperand(0),
APInt::getHighBitsSet(OrigBitWidth, OrigBitWidth-BitWidth), 0, CxtI) &&		APInt::getHighBitsSet(OrigBitWidth, OrigBitWidth-BitWidth), 0, CxtI) &&
CI->getLimitedValue(BitWidth) < BitWidth) {		CI->getLimitedValue(BitWidth) < BitWidth) {
return canEvaluateTruncated(I->getOperand(0), Ty, IC, CxtI);		return canEvaluateTruncated(I->getOperand(0), Ty, IC, CxtI);
}		}
}		}
break;		break;
		case Instruction::AShr:
		// If this is a truncate of an arithmetic shr, we can truncate it to a
		// smaller ashr iff we know that all the bits from the sign bit of the
		// original type down to the sign bit of the truncated type are identical.
		// TODO: It is enough to check that the bits we would be shifting in are
		// identical to the sign bit of the truncated type.
		if (ConstantInt *CI = dyn_cast<ConstantInt>(I->getOperand(1))) {
		spatelUnsubmitted Done Reply Inline Actions Over in D36763, we're going to make (or maybe already have made) the other shift cases splat-vector-friendly. Can you do the same here and add a vector test? spatel: Over in D36763, we're going to make (or maybe already have made) the other shift cases splat-vector…
		uint32_t OrigBitWidth = OrigTy->getScalarSizeInBits();
		uint32_t BitWidth = Ty->getScalarSizeInBits();
		if (CI->getLimitedValue(BitWidth) < BitWidth &&
		OrigBitWidth - BitWidth <
		IC.ComputeNumSignBits(I->getOperand(0), 0, CxtI))
		return canEvaluateTruncated(I->getOperand(0), Ty, IC, CxtI);
		}
		break;
case Instruction::Trunc:		case Instruction::Trunc:
// trunc(trunc(x)) -> trunc(x)		// trunc(trunc(x)) -> trunc(x)
return true;		return true;
case Instruction::ZExt:		case Instruction::ZExt:
case Instruction::SExt:		case Instruction::SExt:
// trunc(ext(x)) -> ext(x) if the source type is smaller than the new dest		// trunc(ext(x)) -> ext(x) if the source type is smaller than the new dest
// trunc(ext(x)) -> trunc(x) if the source type is larger than the new dest		// trunc(ext(x)) -> trunc(x) if the source type is larger than the new dest
return true;		return true;
▲ Show 20 Lines • Show All 1,955 Lines • Show Last 20 Lines

lib/Transforms/InstCombine/InstCombineShifts.cpp

Show First 20 Lines • Show All 553 Lines • ▼ Show 20 Lines	if (match(Op1, m_APInt(ShAmtAPInt))) {
Value *X;		Value *X;
if (match(Op0, m_ZExt(m_Value(X)))) {		if (match(Op0, m_ZExt(m_Value(X)))) {
unsigned SrcWidth = X->getType()->getScalarSizeInBits();		unsigned SrcWidth = X->getType()->getScalarSizeInBits();
if (ShAmt < SrcWidth &&		if (ShAmt < SrcWidth &&
MaskedValueIsZero(X, APInt::getHighBitsSet(SrcWidth, ShAmt), 0, &I))		MaskedValueIsZero(X, APInt::getHighBitsSet(SrcWidth, ShAmt), 0, &I))
return new ZExtInst(Builder.CreateShl(X, ShAmt), Ty);		return new ZExtInst(Builder.CreateShl(X, ShAmt), Ty);
}		}

// (X >>u C) << C --> X & (-1 << C)		// (X >>u C) << C --> X & (-1 << C)
if (match(Op0, m_LShr(m_Value(X), m_Specific(Op1)))) {		// (X >>s C) << C --> X & (-1 << C)
		if (match(Op0, m_LShr(m_Value(X), m_Specific(Op1))) \|\|
		match(Op0, m_AShr(m_Value(X), m_Specific(Op1)))) {
		spatelUnsubmitted Not Done Reply Inline Actions Use 'm_Shr' to reduce the code. This change is independent of anything else, so I think it should go in first. http://rise4fun.com/Alive/lBi Here's a test you can use for that patch: define i8 @shishi(i8 %x) { %a = ashr i8 %x, 6 %b = shl i8 %a, 6 %extra_use_of_a = mul i8 %a, 5 %r = sdiv i8 %extra_use_of_a, %b ret i8 %r } spatel: Use 'm_Shr' to reduce the code. This change is independent of anything else, so I think it…
APInt Mask(APInt::getHighBitsSet(BitWidth, BitWidth - ShAmt));		APInt Mask(APInt::getHighBitsSet(BitWidth, BitWidth - ShAmt));
return BinaryOperator::CreateAnd(X, ConstantInt::get(Ty, Mask));		return BinaryOperator::CreateAnd(X, ConstantInt::get(Ty, Mask));
}		}

// Be careful about hiding shl instructions behind bit masks. They are used		// Be careful about hiding shl instructions behind bit masks. They are used
// to represent multiplies by a constant, and it is important that simple		// to represent multiplies by a constant, and it is important that simple
// arithmetic expressions are still recognizable by scalar evolution.		// arithmetic expressions are still recognizable by scalar evolution.
// The inexact versions are deferred to DAGCombine, so we don't hide shl		// The inexact versions are deferred to DAGCombine, so we don't hide shl
▲ Show 20 Lines • Show All 248 Lines • Show Last 20 Lines

lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp

Show First 20 Lines • Show All 459 Lines • ▼ Show 20 Lines	if (match(I->getOperand(1), m_APInt(SA))) {
if (ShiftAmt)		if (ShiftAmt)
Known.Zero.setLowBits(ShiftAmt);		Known.Zero.setLowBits(ShiftAmt);
}		}
break;		break;
}		}
case Instruction::LShr: {		case Instruction::LShr: {
const APInt *SA;		const APInt *SA;
if (match(I->getOperand(1), m_APInt(SA))) {		if (match(I->getOperand(1), m_APInt(SA))) {
uint64_t ShiftAmt = SA->getLimitedValue(BitWidth-1);		uint32_t ShiftAmt = SA->getLimitedValue(BitWidth-1);
		spatelUnsubmitted Not Done Reply Inline Actions Why change this in this patch? Seem like that might be better as just 'unsigned', but either way, I think it's an independent diff. spatel: Why change this in this patch? Seem like that might be better as just 'unsigned', but either…
		aaboudAuthorUnsubmitted Not Done Reply Inline Actions I changed it to uint32_t to be consistent with line 507 (the case for AShr). Sure, we can commit this separately. Do we need a review for this? Do you want to take care of it? Or should I just commit it now? aaboud: I changed it to uint32_t to be consistent with line 507 (the case for AShr). Sure, we can commit…
		spatelUnsubmitted Not Done Reply Inline Actions Ah, I see the LangRef says we're allowed to go up to 24 bits of width: http://llvm.org/docs/LangRef.html#integer-type So I guess it's ok to specify 32-bit here...or just change them all to 'unsigned'? Either way seems fine to me. Feel free to commit separately. spatel: Ah, I see the LangRef says we're allowed to go up to 24 bits of width: http://llvm.

// Unsigned shift right.		// Unsigned shift right.
APInt DemandedMaskIn(DemandedMask.shl(ShiftAmt));		APInt DemandedMaskIn(DemandedMask.shl(ShiftAmt));

// If the shift is exact, then it does demand the low bits (and knows that		// If the shift is exact, then it does demand the low bits (and knows that
// they are zero).		// they are zero).
if (cast<LShrOperator>(I)->isExact())		if (cast<LShrOperator>(I)->isExact())
DemandedMaskIn.setLowBits(ShiftAmt);		DemandedMaskIn.setLowBits(ShiftAmt);
Show All 39 Lines	if (match(I->getOperand(1), m_APInt(SA))) {
// If the shift is exact, then it does demand the low bits (and knows that		// If the shift is exact, then it does demand the low bits (and knows that
// they are zero).		// they are zero).
if (cast<AShrOperator>(I)->isExact())		if (cast<AShrOperator>(I)->isExact())
DemandedMaskIn.setLowBits(ShiftAmt);		DemandedMaskIn.setLowBits(ShiftAmt);

if (SimplifyDemandedBits(I, 0, DemandedMaskIn, Known, Depth + 1))		if (SimplifyDemandedBits(I, 0, DemandedMaskIn, Known, Depth + 1))
return I;		return I;

		unsigned SignBits = ComputeNumSignBits(I->getOperand(0), 0, CxtI);

assert(!Known.hasConflict() && "Bits known to be one AND zero?");		assert(!Known.hasConflict() && "Bits known to be one AND zero?");
// Compute the new bits that are at the top now.		// Compute the new bits that are at the top now.
APInt HighBits(APInt::getHighBitsSet(BitWidth, ShiftAmt));		APInt HighBits(APInt::getHighBitsSet(
		BitWidth, std::min(SignBits + ShiftAmt - 1, BitWidth)));
Known.Zero.lshrInPlace(ShiftAmt);		Known.Zero.lshrInPlace(ShiftAmt);
Known.One.lshrInPlace(ShiftAmt);		Known.One.lshrInPlace(ShiftAmt);

// If the input sign bit is known to be zero, or if none of the top bits		// If the input sign bit is known to be zero, or if none of the top bits
// are demanded, turn this into an unsigned shift right.		// are demanded, turn this into an unsigned shift right.
assert(BitWidth > ShiftAmt && "Shift amount not saturated?");		assert(BitWidth > ShiftAmt && "Shift amount not saturated?");
if (Known.Zero[BitWidth-ShiftAmt-1] \|\|		if (Known.Zero[BitWidth-ShiftAmt-1] \|\|
!DemandedMask.intersects(HighBits)) {		!DemandedMask.intersects(HighBits)) {
▲ Show 20 Lines • Show All 1,143 Lines • Show Last 20 Lines

test/Transforms/InstCombine/shift.ll

	Show First 20 Lines • Show All 215 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: [[B1:%.*]] = and i32 %A, -256			; CHECK-NEXT: [[B1:%.*]] = and i32 %A, -256
	; CHECK-NEXT: ret i32 [[B1]]			; CHECK-NEXT: ret i32 [[B1]]
	;			;
	%B = ashr i32 %A, 8			%B = ashr i32 %A, 8
	%C = shl i32 %B, 8			%C = shl i32 %B, 8
	ret i32 %C			ret i32 %C
	}			}

				;; ((A \| 0xC0000000) >> 8) << 8 === (A & 0x3FFFFF00) \| 0xC0000000
				;; The 'or' with -1073741824 (0xC0000000) forces the top two bits, and
				;; therefore the sign bit, of the ashr operand to one. The expected
				;; output replaces the ashr/shl-by-8 pair with a single 'and' whose mask
				;; 1073741568 (0x3FFFFF00) clears the low 8 bits, followed by the
				;; original 'or'.
				define i32 @test12a(i32 %A) {
				; CHECK-LABEL: @test12a(
				; CHECK-NEXT: [[a:%.*]] = and i32 %A, 1073741568
				; CHECK-NEXT: [[C:%.*]] = or i32 [[a]], -1073741824
				; CHECK-NEXT: ret i32 [[C]]
				;
				%a = or i32 %A, -1073741824
				%B = ashr i32 %a, 8
				%C = shl i32 %B, 8
				ret i32 %C
				}

	;; This transformation is deferred to DAGCombine:			;; This transformation is deferred to DAGCombine:
	;; (A >> 3) << 4 === (A & -8) * 2			;; (A >> 3) << 4 === (A & -8) * 2
	;; The shl may be valuable to scalar evolution.			;; The shl may be valuable to scalar evolution.
	define i8 @test13(i8 %A) {			define i8 @test13(i8 %A) {
	; CHECK-LABEL: @test13(			; CHECK-LABEL: @test13(
	; CHECK-NEXT: [[A:%.*]] = mul i8 %A, 3			; CHECK-NEXT: [[A:%.*]] = mul i8 %A, 3
	; CHECK-NEXT: [[B1:%.*]] = lshr i8 [[A]], 3			; CHECK-NEXT: [[B1:%.*]] = lshr i8 [[A]], 3
	; CHECK-NEXT: [[C:%.*]] = shl i8 [[B1]], 4			; CHECK-NEXT: [[C:%.*]] = shl i8 [[B1]], 4
	▲ Show 20 Lines • Show All 1,087 Lines • Show Last 20 Lines

test/Transforms/InstCombine/trunc.ll

	Show First 20 Lines • Show All 71 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: ret i32 [[C]]			; CHECK-NEXT: ret i32 [[C]]
	;			;
	%B = zext i32 %A to i128			%B = zext i32 %A to i128
	%C = lshr i128 %B, 16			%C = lshr i128 %B, 16
	%D = trunc i128 %C to i32			%D = trunc i128 %C to i32
	ret i32 %D			ret i32 %D
	}			}

				;; Signed counterpart of the zext/lshr test above: an i32 value is
				;; sign-extended to i128, arithmetically shifted right by 16 and
				;; truncated back to i32. The expected output is a single i32 ashr with
				;; no extension or truncation left.
				define i32 @test5_ashr(i32 %A) {
				; CHECK-LABEL: @test5_ashr(
				; CHECK-NEXT: [[C:%.*]] = ashr i32 %A, 16
				; CHECK-NEXT: ret i32 [[C]]
				;
				%B = sext i32 %A to i128
				%C = ashr i128 %B, 16
				%D = trunc i128 %C to i32
				ret i32 %D
				}

	define i32 @test6(i64 %A) {			define i32 @test6(i64 %A) {
	; CHECK-LABEL: @test6(			; CHECK-LABEL: @test6(
	; CHECK-NEXT: [[C:%.*]] = lshr i64 %A, 32			; CHECK-NEXT: [[C:%.*]] = lshr i64 %A, 32
	; CHECK-NEXT: [[D:%.*]] = trunc i64 [[C]] to i32			; CHECK-NEXT: [[D:%.*]] = trunc i64 [[C]] to i32
	; CHECK-NEXT: ret i32 [[D]]			; CHECK-NEXT: ret i32 [[D]]
	;			;
	%B = zext i64 %A to i128			%B = zext i64 %A to i128
	%C = lshr i128 %B, 32			%C = lshr i128 %B, 32
	%D = trunc i128 %C to i32			%D = trunc i128 %C to i32
	ret i32 %D			ret i32 %D
	}			}

				;; The input uses sext + ashr by 32 on i128, but the result is truncated
				;; to i32, which is narrower than the i64 source. Only bits 32..63 of %A
				;; survive the trunc, so no shifted-in sign bits are observable; the
				;; expected output is an i64 lshr followed by a trunc to i32 (hence the
				;; "_lshr" suffix in the test name).
				define i32 @test6_lshr(i64 %A) {
				; CHECK-LABEL: @test6_lshr(
				; CHECK-NEXT: [[C:%.*]] = lshr i64 %A, 32
				; CHECK-NEXT: [[D:%.*]] = trunc i64 [[C]] to i32
				; CHECK-NEXT: ret i32 [[D]]
				;
				%B = sext i64 %A to i128
				%C = ashr i128 %B, 32
				%D = trunc i128 %C to i32
				ret i32 %D
				}

				;; An i64 value is sign-extended to i128, arithmetically shifted right
				;; by 33 and truncated back to i64 (the source width). The expected
				;; output performs the ashr directly on i64 with the same shift amount.
				define i64 @test6_ashr(i64 %A) {
				; CHECK-LABEL: @test6_ashr(
				; CHECK-NEXT: [[C:%.*]] = ashr i64 %A, 33
				; CHECK-NEXT: ret i64 [[C]]
				;
				%B = sext i64 %A to i128
				%C = ashr i128 %B, 33
				%D = trunc i128 %C to i64
				ret i64 %D
				}

				;; trunc(ashr(mul(sext(X), sext(Y)), 15)) from i32 to i16. The product
				;; of two sign-extended i8 values needs at most 16 significant bits, so
				;; the expected output narrows the whole chain to i16: the sexts target
				;; i16, the mul becomes an i16 'mul nsw', and the ashr operates on i16.
				;; The expected-output lines refer to earlier results through the
				;; captured FileCheck variables ([[C]], [[D]]) rather than literal value
				;; names, so the test does not depend on how the optimizer names values.
				define i16 @test6_ashr_mul(i8 %X, i8 %Y) {
				; CHECK-LABEL: @test6_ashr_mul(
				; CHECK-NEXT: [[A:%.*]] = sext i8 %X to i16
				; CHECK-NEXT: [[B:%.*]] = sext i8 %Y to i16
				; CHECK-NEXT: [[C:%.*]] = mul nsw i16 [[A]], [[B]]
				; CHECK-NEXT: [[D:%.*]] = ashr i16 [[C]], 15
				; CHECK-NEXT: ret i16 [[D]]
				;
				%A = sext i8 %X to i32
				%B = sext i8 %Y to i32
				%C = mul i32 %A, %B
				%D = ashr i32 %C, 15
				%E = trunc i32 %D to i16
				ret i16 %E
				}

	define i92 @test7(i64 %A) {			define i92 @test7(i64 %A) {
	; CHECK-LABEL: @test7(			; CHECK-LABEL: @test7(
	; CHECK-NEXT: [[TMP1:%.*]] = lshr i64 %A, 32			; CHECK-NEXT: [[TMP1:%.*]] = lshr i64 %A, 32
	; CHECK-NEXT: [[D:%.*]] = zext i64 [[TMP1]] to i92			; CHECK-NEXT: [[D:%.*]] = zext i64 [[TMP1]] to i92
	; CHECK-NEXT: ret i92 [[D]]			; CHECK-NEXT: ret i92 [[D]]
	;			;
	%B = zext i64 %A to i128			%B = zext i64 %A to i128
	%C = lshr i128 %B, 32			%C = lshr i128 %B, 32
	%D = trunc i128 %C to i92			%D = trunc i128 %C to i92
	ret i92 %D			ret i92 %D
	}			}

				;; Signed counterpart of test7: an i64 value is sign-extended to i128,
				;; arithmetically shifted right by 32 and truncated to i92, which is
				;; wider than the i64 source. The expected output sign-extends straight
				;; to i92 and performs the ashr in i92, with no trunc remaining.
				define i92 @test7_ashr(i64 %A) {
				; CHECK-LABEL: @test7_ashr(
				; CHECK-NEXT: [[B:%.*]] = sext i64 %A to i92
				; CHECK-NEXT: [[C:%.*]] = ashr i92 [[B]], 32
				; CHECK-NEXT: ret i92 [[C]]
				;
				%B = sext i64 %A to i128
				%C = ashr i128 %B, 32
				%D = trunc i128 %C to i92
				ret i92 %D
				}

	define i64 @test8(i32 %A, i32 %B) {			define i64 @test8(i32 %A, i32 %B) {
	; CHECK-LABEL: @test8(			; CHECK-LABEL: @test8(
	; CHECK-NEXT: [[TMP38:%.*]] = zext i32 %A to i64			; CHECK-NEXT: [[TMP38:%.*]] = zext i32 %A to i64
	; CHECK-NEXT: [[TMP32:%.*]] = zext i32 %B to i64			; CHECK-NEXT: [[TMP32:%.*]] = zext i32 %B to i64
	; CHECK-NEXT: [[TMP33:%.*]] = shl nuw i64 [[TMP32]], 32			; CHECK-NEXT: [[TMP33:%.*]] = shl nuw i64 [[TMP32]], 32
	; CHECK-NEXT: [[INS35:%.*]] = or i64 [[TMP33]], [[TMP38]]			; CHECK-NEXT: [[INS35:%.*]] = or i64 [[TMP33]], [[TMP38]]
	; CHECK-NEXT: ret i64 [[INS35]]			; CHECK-NEXT: ret i64 [[INS35]]
	;			;
	▲ Show 20 Lines • Show All 457 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Added support for: trunc(ashr(mul(sext(...), sext(...))) -> ashr(mul(...))
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 110960

lib/Analysis/ValueTracking.cpp

lib/Transforms/InstCombine/InstCombineCasts.cpp

lib/Transforms/InstCombine/InstCombineShifts.cpp

lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp

test/Transforms/InstCombine/shift.ll

test/Transforms/InstCombine/trunc.ll

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Added support for: trunc(ashr(mul(sext(...), sext(...))) -> ashr(mul(...))
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 110960

lib/Analysis/ValueTracking.cpp

lib/Transforms/InstCombine/InstCombineCasts.cpp

lib/Transforms/InstCombine/InstCombineShifts.cpp

lib/Transforms/InstCombine/InstCombineSimplifyDemanded.cpp

test/Transforms/InstCombine/shift.ll

test/Transforms/InstCombine/trunc.ll

[InstCombine] Added support for: trunc(ashr(mul(sext(...), sext(...))) -> ashr(mul(...))
ClosedPublic