This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Move an optimization from foldICmpAndConstConst to foldICmpUsingKnownBits
ClosedPublic

Authored by craig.topper on Sep 22 2017, 3:08 PM.

Download Raw Diff

Details

Reviewers

Commits

rG30dc9797e9fd: [InstCombine] Move an optimization from foldICmpAndConstConst to…
rL314153: [InstCombine] Move an optimization from foldICmpAndConstConst to…

Summary

All this optimization cares about is how many low bits of the LHS are known to be zero, and whether that means the LHS value is either 0 or greater than the RHS constant. It doesn't matter where the zeros in the low bits came from, so we don't need to specifically look for an AND. Instead we can use known bits.

Diff Detail

Event Timeline

craig.topper created this revision. · Sep 22 2017, 3:08 PM

Forgot to add full context

LGTM.

Given that we're already calling computeKnownBits here, this seems ok. Is there a real motivating benchmark though? If so, I think you want to add a reduction of that, so we're less likely to lose it if/when there's a rewrite of instcombine.

Also, I commented on D38206 before I saw this patch, so this patch may make that comment moot. Although similar to this case, another test to check a less restricted version would be good if you've seen it in the real world.

This revision is now accepted and ready to land. · Sep 25 2017, 1:45 PM

This didn't come from any real benchmark. The one-use restriction on foldICmpAndShift was something I saw in real code, though it was with an ashr, so I still have another patch to come. Then, while I was reviewing the nearby code, I saw the missing inverse case on this transform, which I fixed last week in D38065. But then I started thinking about it more and thought maybe we should handle any kind of zeros, not just zeros created by ANDs.

Closed by commit rL314153: [InstCombine] Move an optimization from foldICmpAndConstConst to… (authored by ctopper). · Explain Why · Sep 25 2017, 2:16 PM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

lib/

Transforms/

InstCombine/

InstCombineCompares.cpp

26 lines

Diff 116414

lib/Transforms/InstCombine/InstCombineCompares.cpp

Show First 20 Lines • Show All 1,708 Lines • ▼ Show 20 Lines	if (match(Or, m_Or(m_Value(LShr), m_Value(A))) &&
if (NewOr) {		if (NewOr) {
Value *NewAnd = Builder.CreateAnd(A, NewOr, And->getName());		Value *NewAnd = Builder.CreateAnd(A, NewOr, And->getName());
Cmp.setOperand(0, NewAnd);		Cmp.setOperand(0, NewAnd);
return &Cmp;		return &Cmp;
}		}
}		}
}		}

// (X & C2) > C1 --> (X & C2) != 0, if any bit set in (X & C2) will produce a
// result greater than C1. Also handle (X & C2) < C1 --> (X & C2) == 0.
if (!C2->isNullValue()) {
unsigned NumTZ = C2->countTrailingZeros();
if (Cmp.getPredicate() == ICmpInst::ICMP_UGT &&
NumTZ >= C1->getActiveBits()) {
Constant *Zero = Constant::getNullValue(And->getType());
return new ICmpInst(ICmpInst::ICMP_NE, And, Zero);
}
if (Cmp.getPredicate() == ICmpInst::ICMP_ULT &&
NumTZ >= C1->ceilLogBase2()) {
Constant *Zero = Constant::getNullValue(And->getType());
return new ICmpInst(ICmpInst::ICMP_EQ, And, Zero);
}
}

return nullptr;		return nullptr;
}		}

/// Fold icmp (and X, Y), C.		/// Fold icmp (and X, Y), C.
Instruction *InstCombiner::foldICmpAndConstant(ICmpInst &Cmp,		Instruction *InstCombiner::foldICmpAndConstant(ICmpInst &Cmp,
BinaryOperator *And,		BinaryOperator *And,
const APInt *C) {		const APInt *C) {
if (Instruction *I = foldICmpAndConstConst(Cmp, And, C))		if (Instruction *I = foldICmpAndConstConst(Cmp, And, C))
▲ Show 20 Lines • Show All 2,475 Lines • ▼ Show 20 Lines	case ICmpInst::ICMP_ULT: {
if (Op1Min == Op0Max) // A <u B -> A != B if max(A) == min(B)		if (Op1Min == Op0Max) // A <u B -> A != B if max(A) == min(B)
return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);		return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

if (Op1Min == Op1Max) {		if (Op1Min == Op1Max) {
// A <u C -> A == C-1 if min(A)+1 == C		// A <u C -> A == C-1 if min(A)+1 == C
if (Op1Min == Op0Min + 1)		if (Op1Min == Op0Min + 1)
return new ICmpInst(ICmpInst::ICMP_EQ, Op0,		return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
ConstantInt::get(Op0->getType(), Op1Min - 1));		ConstantInt::get(Op0->getType(), Op1Min - 1));
		// X <u C --> X == 0, if the number of zero bits in the bottom of X
		// exceeds the log2 of C.
		if (Op0Known.countMinTrailingZeros() >= Op1Min.ceilLogBase2())
		return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
		Constant::getNullValue(Op1->getType()));
}		}
break;		break;
}		}
case ICmpInst::ICMP_UGT: {		case ICmpInst::ICMP_UGT: {
if (Op0Min.ugt(Op1Max)) // A >u B -> true if min(A) > max(B)		if (Op0Min.ugt(Op1Max)) // A >u B -> true if min(A) > max(B)
return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));		return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
if (Op0Max.ule(Op1Min)) // A >u B -> false if max(A) <= max(B)		if (Op0Max.ule(Op1Min)) // A >u B -> false if max(A) <= max(B)
return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));		return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
if (Op1Max == Op0Min) // A >u B -> A != B if min(A) == max(B)		if (Op1Max == Op0Min) // A >u B -> A != B if min(A) == max(B)
return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);		return new ICmpInst(ICmpInst::ICMP_NE, Op0, Op1);

if (Op1Min == Op1Max) {		if (Op1Min == Op1Max) {
// A >u C -> A == C+1 if max(a)-1 == C		// A >u C -> A == C+1 if max(a)-1 == C
if (Op1Min == Op0Max - 1)		if (Op1Min == Op0Max - 1)
return new ICmpInst(ICmpInst::ICMP_EQ, Op0,		return new ICmpInst(ICmpInst::ICMP_EQ, Op0,
ConstantInt::get(Op1->getType(), Op1Min + 1));		ConstantInt::get(Op1->getType(), Op1Min + 1));
		// X >u C --> X != 0, if the number of zero bits in the bottom of X
		// exceeds the log2 of C.
		if (Op0Known.countMinTrailingZeros() >= Op1Min.getActiveBits())
		return new ICmpInst(ICmpInst::ICMP_NE, Op0,
		Constant::getNullValue(Op1->getType()));
}		}
break;		break;
}		}
case ICmpInst::ICMP_SLT:		case ICmpInst::ICMP_SLT:
if (Op0Max.slt(Op1Min)) // A <s B -> true if max(A) < min(C)		if (Op0Max.slt(Op1Min)) // A <s B -> true if max(A) < min(C)
return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));		return replaceInstUsesWith(I, ConstantInt::getTrue(I.getType()));
if (Op0Min.sge(Op1Max)) // A <s B -> false if min(A) >= max(C)		if (Op0Min.sge(Op1Max)) // A <s B -> false if min(A) >= max(C)
return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));		return replaceInstUsesWith(I, ConstantInt::getFalse(I.getType()));
▲ Show 20 Lines • Show All 867 Lines • Show Last 20 Lines