Diff 496307

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 4,903 Lines • ▼ Show 20 Lines	Instruction *InstCombinerImpl::foldICmpEquality(ICmpInst &I) {
if (match(Op1, m_c_And(m_Specific(Op0), m_Value())) &&		if (match(Op1, m_c_And(m_Specific(Op0), m_Value())) &&
isKnownToBeAPowerOfTwo(Op0, /* OrZero */ false, 0, &I))		isKnownToBeAPowerOfTwo(Op0, /* OrZero */ false, 0, &I))
return new ICmpInst(CmpInst::getInversePredicate(Pred), Op1,		return new ICmpInst(CmpInst::getInversePredicate(Pred), Op1,
ConstantInt::getNullValue(Op1->getType()));		ConstantInt::getNullValue(Op1->getType()));

return nullptr;		return nullptr;
}		}

static Instruction *foldICmpWithTrunc(ICmpInst &ICmp,		Instruction *InstCombinerImpl::foldICmpWithTrunc(ICmpInst &ICmp) {
InstCombiner::BuilderTy &Builder) {
ICmpInst::Predicate Pred = ICmp.getPredicate();		ICmpInst::Predicate Pred = ICmp.getPredicate();
Value *Op0 = ICmp.getOperand(0), *Op1 = ICmp.getOperand(1);		Value *Op0 = ICmp.getOperand(0), *Op1 = ICmp.getOperand(1);

// Try to canonicalize trunc + compare-to-constant into a mask + cmp.		// Try to canonicalize trunc + compare-to-constant into a mask + cmp.
// The trunc masks high bits while the compare may effectively mask low bits.		// The trunc masks high bits while the compare may effectively mask low bits.
Value *X;		Value *X;
const APInt *C;		const APInt *C;
if (!match(Op0, m_OneUse(m_Trunc(m_Value(X)))) || !match(Op1, m_APInt(C)))		if (!match(Op0, m_OneUse(m_Trunc(m_Value(X)))) || !match(Op1, m_APInt(C)))
Show All 21 Lines	Instruction *InstCombinerImpl::foldICmpWithTrunc(ICmpInst &ICmp) {
if (Pred == ICmpInst::ICMP_UGT && (~*C).isPowerOf2()) {		if (Pred == ICmpInst::ICMP_UGT && (~*C).isPowerOf2()) {
// If C is not-of-power-of-2 (one clear bit):		// If C is not-of-power-of-2 (one clear bit):
// (trunc X) u> C --> (X & (C+1)) == C+1 (are all masked-high-bits set?)		// (trunc X) u> C --> (X & (C+1)) == C+1 (are all masked-high-bits set?)
Constant *MaskC = ConstantInt::get(X->getType(), (*C + 1).zext(SrcBits));		Constant *MaskC = ConstantInt::get(X->getType(), (*C + 1).zext(SrcBits));
Value *And = Builder.CreateAnd(X, MaskC);		Value *And = Builder.CreateAnd(X, MaskC);
return new ICmpInst(ICmpInst::ICMP_EQ, And, MaskC);		return new ICmpInst(ICmpInst::ICMP_EQ, And, MaskC);
}		}

		if (auto *II = dyn_cast<IntrinsicInst>(X)) {
		goldstein.w.nUnsubmitted Not Done Reply Inline Actions Imo it makes more sense to do this generically. `(icmp P (trunc(X), C))` if `KnownBits(X)[OrigWidth:TruncWidth] == 0` just drop the truncate. That will cover all these intrins + any other cases that happen to come up. goldstein.w.n: Imo it makes more sense to do this generically. `(icmp P (trunc(X), C))` if `KnownBits(X)…
		bcl5980AuthorUnsubmitted Done Reply Inline Actions I don't want to enable all cases for the trunc. That may cause a lot of potential regressions. By default we should shrink bits if possible, not expand them. I prefer to limit the change to the cases where we can really get an improvement. Maybe I can move this change to SDAG to avoid these concerns. bcl5980: I don't want to enable all cases for the trunc. That may cause a lot of potential regressions.
		goldstein.w.nUnsubmitted Not Done Reply Inline Actions This seems to only match `m_OneUse(m_Trunc(...))`, so it seems like the only case is one where the truncate is entirely eliminated, no? Not sure I see how that could cause regressions. goldstein.w.n: This seems to only match `m_OneUse(m_Trunc(...))`, so it seems like the only case is one where the truncate is…
		bcl5980AuthorUnsubmitted Done Reply Inline Actions What I mean is not an IR-level regression. Think about the case where the source type is i256 and the dest type is i32. Removing the trunc and widening the next instruction back to i256 may cause extra instructions in the backend. bcl5980: What I mean is not an IR-level regression. Think about the case where the source type is i256 and the dest type…
		spatelUnsubmitted Not Done Reply Inline Actions This is a gray area. Ideally, if we can eliminate IR instructions, we do it, but if it results in wider instructions, then it's potentially not an improvement for analysis in IR. The codegen concern is secondary, but yes, we do factor that into the decision because sometimes it is not easy to invert the transform. For this one, it seems unlikely that we'll gain much by using a potentially expensive (in compile-time) ValueTracking API because we probably already have specialized folds for the common patterns where we'd know the high bits are already cleared ('and' or 'lshr'). spatel: This is a gray area. Ideally, if we can eliminate IR instructions, we do it, but if it…
		if (II->getIntrinsicID() == Intrinsic::cttz ||
		II->getIntrinsicID() == Intrinsic::ctlz) {
		unsigned MaxRet = SrcBits;
		spatelUnsubmitted Not Done Reply Inline Actions Require one less bit for cttz/ctlz when the "is_zero_poison" argument is true? spatel: Require one less bit for cttz/ctlz when the "is_zero_poison" argument is true?
		bcl5980AuthorUnsubmitted Done Reply Inline Actions https://alive2.llvm.org/ce/z/pQQavA It looks like requiring one less bit for cttz when is_zero_poison=true is wrong. bcl5980: https://alive2.llvm.org/ce/z/pQQavA It looks like requiring one less bit for cttz when is_zero_poison=true is…
		bcl5980AuthorUnsubmitted Done Reply Inline Actions ah, I'm wrong. Should be llvm::Log2_32_Ceil(SrcBits - is_zero_poison), not Op0 bitwidth - is_zero_poison bcl5980: ah, I'm wrong. Should be llvm::Log2_32_Ceil(SrcBits - is_zero_poison), not Op0 bitwidth…
		// If the "is_zero_poison" argument is set, then we know at least
		// one bit is set in the input, so the result is always at least one
		spatelUnsubmitted Not Done Reply Inline Actions This needs an explanation comment. Something like: // If the "is_zero_poison" argument is set, then we know at least // one bit is set in the input, so the result is always at least one // less than the full bitwidth of that input. spatel: This needs an explanation comment. Something like: // If the "is_zero_poison" argument is set…
		// less than the full bitwidth of that input.
		if (match(II->getArgOperand(1), m_One()))
		spatelUnsubmitted Not Done Reply Inline Actions Adjust word choice: // Make sure the destination is wide enough to hold the largest output of the intrinsic. spatel: Adjust word choice: // Make sure the destination is wide enough to hold the largest output of…
		MaxRet--;

		// Make sure the destination is wide enough to hold the largest output of
		// the intrinsic.
		if (llvm::Log2_32(MaxRet) + 1 <= Op0->getType()->getScalarSizeInBits())
		if (Instruction *I =
		foldICmpIntrinsicWithConstant(ICmp, II, C->zext(SrcBits)))
		return I;
		}
		}

return nullptr;		return nullptr;
}		}

Instruction *InstCombinerImpl::foldICmpWithZextOrSext(ICmpInst &ICmp) {		Instruction *InstCombinerImpl::foldICmpWithZextOrSext(ICmpInst &ICmp) {
assert(isa<CastInst>(ICmp.getOperand(0)) && "Expected cast for operand 0");		assert(isa<CastInst>(ICmp.getOperand(0)) && "Expected cast for operand 0");
auto *CastOp0 = cast<CastInst>(ICmp.getOperand(0));		auto *CastOp0 = cast<CastInst>(ICmp.getOperand(0));
Value *X;		Value *X;
if (!match(CastOp0, m_ZExtOrSExt(m_Value(X))))		if (!match(CastOp0, m_ZExtOrSExt(m_Value(X))))
▲ Show 20 Lines • Show All 141 Lines • ▼ Show 20 Lines	if (CastOp0->getOpcode() == Instruction::PtrToInt &&
} else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {		} else if (auto *RHSC = dyn_cast<Constant>(ICmp.getOperand(1))) {
NewOp1 = ConstantExpr::getIntToPtr(RHSC, SrcTy);		NewOp1 = ConstantExpr::getIntToPtr(RHSC, SrcTy);
}		}

if (NewOp1)		if (NewOp1)
return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);		return new ICmpInst(ICmp.getPredicate(), Op0Src, NewOp1);
}		}

if (Instruction *R = foldICmpWithTrunc(ICmp, Builder))		if (Instruction *R = foldICmpWithTrunc(ICmp))
return R;		return R;

return foldICmpWithZextOrSext(ICmp);		return foldICmpWithZextOrSext(ICmp);
}		}

static bool isNeutralValue(Instruction::BinaryOps BinaryOp, Value *RHS, bool IsSigned) {		static bool isNeutralValue(Instruction::BinaryOps BinaryOp, Value *RHS, bool IsSigned) {
switch (BinaryOp) {		switch (BinaryOp) {
default:		default:
▲ Show 20 Lines • Show All 2,053 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

Show First 20 Lines • Show All 618 Lines • ▼ Show 20 Lines	public:
Instruction *foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp,		Instruction *foldICmpBinOpEqualityWithConstant(ICmpInst &Cmp,
BinaryOperator *BO,		BinaryOperator *BO,
const APInt &C);		const APInt &C);
Instruction *foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II,		Instruction *foldICmpIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II,
const APInt &C);		const APInt &C);
Instruction *foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II,		Instruction *foldICmpEqIntrinsicWithConstant(ICmpInst &ICI, IntrinsicInst *II,
const APInt &C);		const APInt &C);
Instruction *foldICmpBitCast(ICmpInst &Cmp);		Instruction *foldICmpBitCast(ICmpInst &Cmp);
		Instruction *foldICmpWithTrunc(ICmpInst &Cmp);

// Helpers of visitSelectInst().		// Helpers of visitSelectInst().
Instruction *foldSelectOfBools(SelectInst &SI);		Instruction *foldSelectOfBools(SelectInst &SI);
Instruction *foldSelectExtConst(SelectInst &Sel);		Instruction *foldSelectExtConst(SelectInst &Sel);
Instruction *foldSelectOpOp(SelectInst &SI, Instruction *TI, Instruction *FI);		Instruction *foldSelectOpOp(SelectInst &SI, Instruction *TI, Instruction *FI);
Instruction *foldSelectIntoOp(SelectInst &SI, Value *, Value *);		Instruction *foldSelectIntoOp(SelectInst &SI, Value *, Value *);
Instruction *foldSPFofSPF(Instruction *Inner, SelectPatternFlavor SPF1,		Instruction *foldSPFofSPF(Instruction *Inner, SelectPatternFlavor SPF1,
Value *A, Value *B, Instruction &Outer,		Value *A, Value *B, Instruction &Outer,
▲ Show 20 Lines • Show All 79 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/cmp-intrinsic.ll

Show First 20 Lines • Show All 537 Lines • ▼ Show 20 Lines	;
%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 false)		%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 false)
%trunc = trunc i33 %tz to i15		%trunc = trunc i33 %tz to i15
%cmp = icmp ugt i15 %trunc, 3		%cmp = icmp ugt i15 %trunc, 3
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_cttz_ult_other_i33_i6(i33 %x) {		define i1 @trunc_cttz_ult_other_i33_i6(i33 %x) {
; CHECK-LABEL: @trunc_cttz_ult_other_i33_i6(		; CHECK-LABEL: @trunc_cttz_ult_other_i33_i6(
; CHECK-NEXT: [[TZ:%.*]] = tail call i33 @llvm.cttz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]		; CHECK-NEXT: [[TMP1:%.*]] = and i33 [[X:%.*]], 127
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[TZ]] to i6		; CHECK-NEXT: [[CMP:%.*]] = icmp ne i33 [[TMP1]], 0
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i6 [[TRUNC]], 7
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 true)		%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 true)
		spatelUnsubmitted Not Done Reply Inline Actions Why truncate to i15? IIUC, the transform is valid on this example for truncate down to 6 bits, but not 5 bits. So we should have both of those variations. The source type width should be tested similarly, so if we start with i32, it is ok to truncate to i5, but not i4? spatel: Why truncate to i15? IIUC, the transform is valid on this example for truncate down to 6 bits…
%trunc = trunc i33 %tz to i6		%trunc = trunc i33 %tz to i6
%cmp = icmp ult i6 %trunc, 7		%cmp = icmp ult i6 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

		; negative case: log2(33 - (is_zero_poison ? 1 : 0)) + 1 > 5

define i1 @trunc_cttz_ult_other_i33_i5(i33 %x) {		define i1 @trunc_cttz_ult_other_i33_i5(i33 %x) {
; CHECK-LABEL: @trunc_cttz_ult_other_i33_i5(		; CHECK-LABEL: @trunc_cttz_ult_other_i33_i5(
; CHECK-NEXT: [[TZ:%.*]] = tail call i33 @llvm.cttz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]		; CHECK-NEXT: [[TZ:%.*]] = tail call i33 @llvm.cttz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[TZ]] to i5		; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[TZ]] to i5
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i5 [[TRUNC]], 7		; CHECK-NEXT: [[CMP:%.*]] = icmp ult i5 [[TRUNC]], 7
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 true)		%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 true)
%trunc = trunc i33 %tz to i5		%trunc = trunc i33 %tz to i5
%cmp = icmp ult i5 %trunc, 7		%cmp = icmp ult i5 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_cttz_true_ult_other_i32_i5(i32 %x) {		define i1 @trunc_cttz_true_ult_other_i32_i5(i32 %x) {
; CHECK-LABEL: @trunc_cttz_true_ult_other_i32_i5(		; CHECK-LABEL: @trunc_cttz_true_ult_other_i32_i5(
; CHECK-NEXT: [[TZ:%.*]] = tail call i32 @llvm.cttz.i32(i32 [[X:%.*]], i1 true), !range [[RNG0]]		; CHECK-NEXT: [[TMP1:%.*]] = and i32 [[X:%.*]], 127
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i32 [[TZ]] to i5		; CHECK-NEXT: [[CMP:%.*]] = icmp ne i32 [[TMP1]], 0
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i5 [[TRUNC]], 7
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 true)		%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 true)
%trunc = trunc i32 %tz to i5		%trunc = trunc i32 %tz to i5
%cmp = icmp ult i5 %trunc, 7		%cmp = icmp ult i5 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

Show All 9 Lines	;
%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 false)		%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 false)
%trunc = trunc i32 %tz to i5		%trunc = trunc i32 %tz to i5
%cmp = icmp ult i5 %trunc, 7		%cmp = icmp ult i5 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_cttz_false_ult_other_i32_i6(i32 %x) {		define i1 @trunc_cttz_false_ult_other_i32_i6(i32 %x) {
; CHECK-LABEL: @trunc_cttz_false_ult_other_i32_i6(		; CHECK-LABEL: @trunc_cttz_false_ult_other_i32_i6(
; CHECK-NEXT: [[TZ:%.*]] = tail call i32 @llvm.cttz.i32(i32 [[X:%.*]], i1 false), !range [[RNG0]]		; CHECK-NEXT: [[TMP1:%.*]] = and i32 [[X:%.*]], 127
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i32 [[TZ]] to i6		; CHECK-NEXT: [[CMP:%.*]] = icmp ne i32 [[TMP1]], 0
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i6 [[TRUNC]], 7
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 false)		%tz = tail call i32 @llvm.cttz.i32(i32 %x, i1 false)
%trunc = trunc i32 %tz to i6		%trunc = trunc i32 %tz to i6
%cmp = icmp ult i6 %trunc, 7		%cmp = icmp ult i6 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

Show All 33 Lines	;
%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)		%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)
%trunc = trunc i32 %lz to i15		%trunc = trunc i32 %lz to i15
%cmp = icmp ugt i15 %trunc, 1		%cmp = icmp ugt i15 %trunc, 1
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_ctlz_ugt_other_i33_i6(i33 %x) {		define i1 @trunc_ctlz_ugt_other_i33_i6(i33 %x) {
; CHECK-LABEL: @trunc_ctlz_ugt_other_i33_i6(		; CHECK-LABEL: @trunc_ctlz_ugt_other_i33_i6(
; CHECK-NEXT: [[LZ:%.*]] = tail call i33 @llvm.ctlz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]		; CHECK-NEXT: [[CMP:%.*]] = icmp ult i33 [[X:%.*]], 268435456
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[LZ]] to i6
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i6 [[TRUNC]], 4
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%lz = tail call i33 @llvm.ctlz.i33(i33 %x, i1 true)		%lz = tail call i33 @llvm.ctlz.i33(i33 %x, i1 true)
%trunc = trunc i33 %lz to i6		%trunc = trunc i33 %lz to i6
%cmp = icmp ugt i6 %trunc, 4		%cmp = icmp ugt i6 %trunc, 4
ret i1 %cmp		ret i1 %cmp
}		}

		; negative case: log2(33 - (is_zero_poison ? 1 : 0)) + 1 > 5

define i1 @trunc_ctlz_ugt_other_i33_i5(i33 %x) {		define i1 @trunc_ctlz_ugt_other_i33_i5(i33 %x) {
; CHECK-LABEL: @trunc_ctlz_ugt_other_i33_i5(		; CHECK-LABEL: @trunc_ctlz_ugt_other_i33_i5(
; CHECK-NEXT: [[LZ:%.*]] = tail call i33 @llvm.ctlz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]		; CHECK-NEXT: [[LZ:%.*]] = tail call i33 @llvm.ctlz.i33(i33 [[X:%.*]], i1 true), !range [[RNG1]]
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[LZ]] to i5		; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[LZ]] to i5
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i5 [[TRUNC]], 4		; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i5 [[TRUNC]], 4
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%lz = tail call i33 @llvm.ctlz.i33(i33 %x, i1 true)		%lz = tail call i33 @llvm.ctlz.i33(i33 %x, i1 true)
%trunc = trunc i33 %lz to i5		%trunc = trunc i33 %lz to i5
%cmp = icmp ugt i5 %trunc, 4		%cmp = icmp ugt i5 %trunc, 4
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_ctlz_true_ugt_other_i32_i5(i32 %x) {		define i1 @trunc_ctlz_true_ugt_other_i32_i5(i32 %x) {
; CHECK-LABEL: @trunc_ctlz_true_ugt_other_i32_i5(		; CHECK-LABEL: @trunc_ctlz_true_ugt_other_i32_i5(
; CHECK-NEXT: [[LZ:%.*]] = tail call i32 @llvm.ctlz.i32(i32 [[X:%.*]], i1 true), !range [[RNG0]]		; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[X:%.*]], 134217728
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i32 [[LZ]] to i5
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i5 [[TRUNC]], 4
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true)		%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 true)
%trunc = trunc i32 %lz to i5		%trunc = trunc i32 %lz to i5
%cmp = icmp ugt i5 %trunc, 4		%cmp = icmp ugt i5 %trunc, 4
ret i1 %cmp		ret i1 %cmp
}		}

Show All 9 Lines	;
%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)		%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)
%trunc = trunc i32 %lz to i5		%trunc = trunc i32 %lz to i5
%cmp = icmp ugt i5 %trunc, 4		%cmp = icmp ugt i5 %trunc, 4
ret i1 %cmp		ret i1 %cmp
}		}

define i1 @trunc_ctlz_false_ugt_other_i32_i6(i32 %x) {		define i1 @trunc_ctlz_false_ugt_other_i32_i6(i32 %x) {
; CHECK-LABEL: @trunc_ctlz_false_ugt_other_i32_i6(		; CHECK-LABEL: @trunc_ctlz_false_ugt_other_i32_i6(
; CHECK-NEXT: [[LZ:%.*]] = tail call i32 @llvm.ctlz.i32(i32 [[X:%.*]], i1 false), !range [[RNG0]]		; CHECK-NEXT: [[CMP:%.*]] = icmp ult i32 [[X:%.*]], 134217728
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i32 [[LZ]] to i6
; CHECK-NEXT: [[CMP:%.*]] = icmp ugt i6 [[TRUNC]], 4
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)		%lz = tail call i32 @llvm.ctlz.i32(i32 %x, i1 false)
%trunc = trunc i32 %lz to i6		%trunc = trunc i32 %lz to i6
%cmp = icmp ugt i6 %trunc, 4		%cmp = icmp ugt i6 %trunc, 4
ret i1 %cmp		ret i1 %cmp
}		}

Show All 31 Lines
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%pop = tail call i8 @llvm.ctpop.i8(i8 %x)		%pop = tail call i8 @llvm.ctpop.i8(i8 %x)
%trunc = trunc i8 %pop to i5		%trunc = trunc i8 %pop to i5
%cmp = icmp eq i5 %trunc, 8		%cmp = icmp eq i5 %trunc, 8
ret i1 %cmp		ret i1 %cmp
}		}

		; negative case: log2(33) + 1 > 4

define i1 @trunc_negative_destbits_not_enough(i33 %x) {		define i1 @trunc_negative_destbits_not_enough(i33 %x) {
; CHECK-LABEL: @trunc_negative_destbits_not_enough(		; CHECK-LABEL: @trunc_negative_destbits_not_enough(
; CHECK-NEXT: [[TZ:%.*]] = tail call i33 @llvm.cttz.i33(i33 [[X:%.*]], i1 false), !range [[RNG1]]		; CHECK-NEXT: [[TZ:%.*]] = tail call i33 @llvm.cttz.i33(i33 [[X:%.*]], i1 false), !range [[RNG1]]
; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[TZ]] to i4		; CHECK-NEXT: [[TRUNC:%.*]] = trunc i33 [[TZ]] to i4
; CHECK-NEXT: [[CMP:%.*]] = icmp ult i4 [[TRUNC]], 7		; CHECK-NEXT: [[CMP:%.*]] = icmp ult i4 [[TRUNC]], 7
; CHECK-NEXT: ret i1 [[CMP]]		; CHECK-NEXT: ret i1 [[CMP]]
;		;
%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 false)		%tz = tail call i33 @llvm.cttz.i33(i33 %x, i1 false)
%trunc = trunc i33 %tz to i4		%trunc = trunc i33 %tz to i4
%cmp = icmp ult i4 %trunc, 7		%cmp = icmp ult i4 %trunc, 7
ret i1 %cmp		ret i1 %cmp
}		}

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Look through truncate to fold icmp with intrinsics
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 496307

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

llvm/test/Transforms/InstCombine/cmp-intrinsic.ll

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Look through truncate to fold icmp with intrinsicsClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 496307

llvm/lib/Transforms/InstCombine/InstCombineCompares.cpp

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

llvm/test/Transforms/InstCombine/cmp-intrinsic.ll

[InstCombine] Look through truncate to fold icmp with intrinsics
ClosedPublic