This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
include/llvm/IR/
-
llvm/
-
IR/
-
Instructions.h
-
lib/
-
Analysis/
3
InstructionSimplify.cpp
-
IR/
2
ConstantFold.cpp
-
test/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
-
fcmp.ll

Differential D7617

InstCombine: fix fold "fcmp x, undef" to account for NaN
ClosedPublic

Authored by mehdi_amini on Feb 13 2015, 9:55 AM.

Download Raw Diff

Details

Reviewers

chandlerc
majnemer
hfinkel

Commits

rGeb242a504161: InstCombine: fix fold "fcmp x, undef" to account for NaN

Summary

See the two test cases.

; Can fold fcmp with undef on one side by choosing NaN for the undef

; Can fold fcmp with undef on both side
; fcmp u_pred undef, undef -> true
; fcmp o_pred undef, undef -> false
; because whatever you choose for the first undef
; you can choose NaN for the other undef

Diff Detail

Event Timeline

mehdi_amini updated this revision to Diff 19904.Feb 13 2015, 9:55 AM

mehdi_amini retitled this revision from to InstCombine: cannot fold "fcmp x, undef" because x can be NaN.

mehdi_amini updated this object.

mehdi_amini edited the test plan for this revision. (Show Details)

mehdi_amini added reviewers: chandlerc, hfinkel.

mehdi_amini added a subscriber: Unknown Object (MLST).

I wonder if we could access the target-machine-specific info to know
whether NaNs are disabled?
Or what is the right way to get the -enable-no-nans-fp-math setting in opt?

Check the fast-math flags on the operand (call Op->getFastMathFlags()). The LangRef says:

LLVM IR floating-point binary ops (fadd, fsub, fmul, fdiv, frem) have the following flags that can be set to enable otherwise unsafe floating point operations
...
nnan - No NaNs - Allow optimizations to assume the arguments and result are not NaN. Such optimizations are required to retain defined behavior over NaNs, but the value of the result is undefined.
...
fast - Fast - Allow algebraically equivalent transformations that may dramatically change results in floating point (e.g. reassociate). This flag implies all the others.

For constant values, you can call C->isNaN();

After more thought, I found out we can fold depending on if fcmp is or isn't ordered.

mehdi_amini retitled this revision from InstCombine: cannot fold "fcmp x, undef" because x can be NaN to InstCombine: fix fold "fcmp x, undef" to account for NaN.Feb 21 2015, 1:07 PM

mehdi_amini updated this object.

Ping.

Ping. Can someone look at this InstCombine change?

CC-ing David who seems like he might be in a good position to review this.

majnemer added a subscriber: majnemer.Mar 2 2015, 4:04 PM

majnemer added inline comments.

lib/Analysis/InstructionSimplify.cpp
3044	It would be nice to have `LHS` on the left and `RHS` on the right. I think the comment would be clearer if it mentioned that this simplification will affect `fcmp pred undef, x` as well.
3045	Isn't `Pred` already a `CmpInst::Predicate`? What does this line achieve?
3047	s/fails/fail/
lib/IR/ConstantFold.cpp
1330	perhaps "use the standard constant folder."
1673–1675	Either move the `ICmpInst::isIntPredicate(Predicate) && isa<UndefValue>(C1) && isa<UndefValue>(C2)` check out of this block or simplify it with `ICmpInst::isIntPredicate(Predicate) && C1 == C2`, the line is getting a bit too long.

Update thanks to David's review.

LGTM

This revision is now accepted and ready to land.Mar 4 2015, 11:06 PM

mehdi_amini closed this revision.Mar 8 2015, 8:22 PM

Revision Contents

Path

Size

include/

llvm/

IR/

Instructions.h

10 lines

lib/

Analysis/

InstructionSimplify.cpp

9 lines

IR/

ConstantFold.cpp

27 lines

test/

Transforms/

InstCombine/

fcmp.ll

35 lines

Diff 20466

include/llvm/IR/Instructions.h

Show First 20 Lines • Show All 1,188 Lines • ▼ Show 20 Lines	assert(getOperand(0)->getType() == getOperand(1)->getType() &&
"Both operands to FCmp instruction are not of the same type!");		"Both operands to FCmp instruction are not of the same type!");
// Check that the operands are the right type		// Check that the operands are the right type
assert(getOperand(0)->getType()->isFPOrFPVectorTy() &&		assert(getOperand(0)->getType()->isFPOrFPVectorTy() &&
"Invalid operand types for FCmp instruction");		"Invalid operand types for FCmp instruction");
}		}

/// @returns true if the predicate of this instruction is EQ or NE.		/// @returns true if the predicate of this instruction is EQ or NE.
/// \brief Determine if this is an equality predicate.		/// \brief Determine if this is an equality predicate.
bool isEquality() const {		static bool isEquality(Predicate Pred) {
return getPredicate() == FCMP_OEQ \|\| getPredicate() == FCMP_ONE \|\|		return Pred == FCMP_OEQ \|\| Pred == FCMP_ONE \|\| Pred == FCMP_UEQ \|\|
getPredicate() == FCMP_UEQ \|\| getPredicate() == FCMP_UNE;		Pred == FCMP_UNE;
}		}

		/// @returns true if the predicate of this instruction is EQ or NE.
		/// \brief Determine if this is an equality predicate.
		bool isEquality() const { return isEquality(getPredicate()); }

/// @returns true if the predicate of this instruction is commutative.		/// @returns true if the predicate of this instruction is commutative.
/// \brief Determine if this is a commutative predicate.		/// \brief Determine if this is a commutative predicate.
bool isCommutative() const {		bool isCommutative() const {
return isEquality() \|\|		return isEquality() \|\|
getPredicate() == FCMP_FALSE \|\|		getPredicate() == FCMP_FALSE \|\|
getPredicate() == FCMP_TRUE \|\|		getPredicate() == FCMP_TRUE \|\|
getPredicate() == FCMP_ORD \|\|		getPredicate() == FCMP_ORD \|\|
getPredicate() == FCMP_UNO;		getPredicate() == FCMP_UNO;
▲ Show 20 Lines • Show All 2,612 Lines • Show Last 20 Lines

lib/Analysis/InstructionSimplify.cpp

Show First 20 Lines • Show All 3,034 Lines • ▼ Show 20 Lines	static Value SimplifyFCmpInst(unsigned Predicate, Value LHS, Value *RHS,
}		}

// Fold trivial predicates.		// Fold trivial predicates.
if (Pred == FCmpInst::FCMP_FALSE)		if (Pred == FCmpInst::FCMP_FALSE)
return ConstantInt::get(GetCompareTy(LHS), 0);		return ConstantInt::get(GetCompareTy(LHS), 0);
if (Pred == FCmpInst::FCMP_TRUE)		if (Pred == FCmpInst::FCMP_TRUE)
return ConstantInt::get(GetCompareTy(LHS), 1);		return ConstantInt::get(GetCompareTy(LHS), 1);

if (isa<UndefValue>(RHS)) // fcmp pred X, undef -> undef		// fcmp pred x, undef
return UndefValue::get(GetCompareTy(LHS));		if (isa<UndefValue>(RHS) \|\| isa<UndefValue>(LHS)) {
		majnemerUnsubmitted Not Done Reply Inline Actions It would be nice to have `LHS` on the left and `RHS` on the right. I think the comment would be clearer if it mentioned that this simplification will affect `fcmp pred undef, x` as well. majnemer: It would be nice to have `LHS` on the left and `RHS` on the right. I think the comment would…
		CmpInst::Predicate Predicate = CmpInst::Predicate(Pred);
		majnemerUnsubmitted Not Done Reply Inline Actions Isn't `Pred` already a `CmpInst::Predicate`? What does this line achieve? majnemer: Isn't `Pred` already a `CmpInst::Predicate`? What does this line achieve?
		// Choosing NaN for the undef will always make unordered comparison succeed
		// and ordered comparison fails.
		majnemerUnsubmitted Not Done Reply Inline Actions s/fails/fail/ majnemer: s/fails/fail/
		return ConstantInt::get(GetCompareTy(LHS), CmpInst::isUnordered(Predicate));
		}

// fcmp x,x -> true/false. Not all compares are foldable.		// fcmp x,x -> true/false. Not all compares are foldable.
if (LHS == RHS) {		if (LHS == RHS) {
if (CmpInst::isTrueWhenEqual(Pred))		if (CmpInst::isTrueWhenEqual(Pred))
return ConstantInt::get(GetCompareTy(LHS), 1);		return ConstantInt::get(GetCompareTy(LHS), 1);
if (CmpInst::isFalseWhenEqual(Pred))		if (CmpInst::isFalseWhenEqual(Pred))
return ConstantInt::get(GetCompareTy(LHS), 0);		return ConstantInt::get(GetCompareTy(LHS), 0);
}		}
▲ Show 20 Lines • Show All 772 Lines • Show Last 20 Lines

lib/IR/ConstantFold.cpp

Show First 20 Lines • Show All 1,321 Lines • ▼ Show 20 Lines	static FCmpInst::Predicate evaluateFCmpRelation(Constant V1, Constant V2) {
assert(V1->getType() == V2->getType() &&		assert(V1->getType() == V2->getType() &&
"Cannot compare values of different types!");		"Cannot compare values of different types!");

// Handle degenerate case quickly		// Handle degenerate case quickly
if (V1 == V2) return FCmpInst::FCMP_OEQ;		if (V1 == V2) return FCmpInst::FCMP_OEQ;

if (!isa<ConstantExpr>(V1)) {		if (!isa<ConstantExpr>(V1)) {
if (!isa<ConstantExpr>(V2)) {		if (!isa<ConstantExpr>(V2)) {
// We distilled thisUse the standard constant folder for a few cases		// We distilled this down to a simple case, use standard constant folder.
		majnemerUnsubmitted Not Done Reply Inline Actions perhaps "use the standard constant folder." majnemer: perhaps "use the standard constant folder."
ConstantInt *R = nullptr;		ConstantInt *R = nullptr;
R = dyn_cast<ConstantInt>(		R = dyn_cast<ConstantInt>(
ConstantExpr::getFCmp(FCmpInst::FCMP_OEQ, V1, V2));		ConstantExpr::getFCmp(FCmpInst::FCMP_OEQ, V1, V2));
if (R && !R->isZero())		if (R && !R->isZero())
return FCmpInst::FCMP_OEQ;		return FCmpInst::FCMP_OEQ;
R = dyn_cast<ConstantInt>(		R = dyn_cast<ConstantInt>(
ConstantExpr::getFCmp(FCmpInst::FCMP_OLT, V1, V2));		ConstantExpr::getFCmp(FCmpInst::FCMP_OLT, V1, V2));
if (R && !R->isZero())		if (R && !R->isZero())
▲ Show 20 Lines • Show All 321 Lines • ▼ Show 20 Lines	Constant *llvm::ConstantFoldCompareInstruction(unsigned short pred,
if (pred == FCmpInst::FCMP_FALSE)		if (pred == FCmpInst::FCMP_FALSE)
return Constant::getNullValue(ResultTy);		return Constant::getNullValue(ResultTy);

if (pred == FCmpInst::FCMP_TRUE)		if (pred == FCmpInst::FCMP_TRUE)
return Constant::getAllOnesValue(ResultTy);		return Constant::getAllOnesValue(ResultTy);

// Handle some degenerate cases first		// Handle some degenerate cases first
if (isa<UndefValue>(C1) \|\| isa<UndefValue>(C2)) {		if (isa<UndefValue>(C1) \|\| isa<UndefValue>(C2)) {
		CmpInst::Predicate Predicate = CmpInst::Predicate(pred);
// For EQ and NE, we can always pick a value for the undef to make the		// For EQ and NE, we can always pick a value for the undef to make the
// predicate pass or fail, so we can return undef.		// predicate pass or fail, so we can return undef.
// Also, if both operands are undef, we can return undef.		// Also, if both operands are undef, we can return undef for int comparison.
if (ICmpInst::isEquality(ICmpInst::Predicate(pred)) \|\|		if (ICmpInst::isEquality(Predicate) \|\|
(isa<UndefValue>(C1) && isa<UndefValue>(C2)))		(ICmpInst::isIntPredicate(Predicate) && isa<UndefValue>(C1) &&
		isa<UndefValue>(C2)))
return UndefValue::get(ResultTy);		return UndefValue::get(ResultTy);
		majnemerUnsubmitted Not Done Reply Inline Actions Either move the `ICmpInst::isIntPredicate(Predicate) && isa<UndefValue>(C1) && isa<UndefValue>(C2)` check out of this block or simplify it with `ICmpInst::isIntPredicate(Predicate) && C1 == C2`, the line is getting a bit too long. majnemer: Either move the `ICmpInst::isIntPredicate(Predicate) && isa<UndefValue>(C1) && isa<UndefValue>…
// Otherwise, pick the same value as the non-undef operand, and fold
// it to true or false.		// Otherwise, for integer compare, pick the same value as the non-undef
		// operand, and fold it to true or false.
		if (CmpInst::isIntPredicate(Predicate))
return ConstantInt::get(ResultTy, CmpInst::isTrueWhenEqual(pred));		return ConstantInt::get(ResultTy, CmpInst::isTrueWhenEqual(pred));

		// Choosing NaN for the undef will always make unordered comparison succeed
		// and ordered comparison fails.
		return ConstantInt::get(ResultTy, CmpInst::isUnordered(Predicate));
}		}

// icmp eq/ne(null,GV) -> false/true		// icmp eq/ne(null,GV) -> false/true
if (C1->isNullValue()) {		if (C1->isNullValue()) {
if (const GlobalValue *GV = dyn_cast<GlobalValue>(C2))		if (const GlobalValue *GV = dyn_cast<GlobalValue>(C2))
// Don't try to evaluate aliases. External weak GV can be null.		// Don't try to evaluate aliases. External weak GV can be null.
if (!isa<GlobalAlias>(GV) && !GV->hasExternalWeakLinkage()) {		if (!isa<GlobalAlias>(GV) && !GV->hasExternalWeakLinkage()) {
if (pred == ICmpInst::ICMP_EQ)		if (pred == ICmpInst::ICMP_EQ)
▲ Show 20 Lines • Show All 99 Lines • ▼ Show 20 Lines	for (unsigned i = 0, e = C1->getType()->getVectorNumElements(); i != e;++i){
ConstantExpr::getExtractElement(C2, ConstantInt::get(Ty, i));		ConstantExpr::getExtractElement(C2, ConstantInt::get(Ty, i));

ResElts.push_back(ConstantExpr::getCompare(pred, C1E, C2E));		ResElts.push_back(ConstantExpr::getCompare(pred, C1E, C2E));
}		}

return ConstantVector::get(ResElts);		return ConstantVector::get(ResElts);
}		}

if (C1->getType()->isFloatingPointTy()) {		if (C1->getType()->isFloatingPointTy() &&
		// Only call evaluateFCmpRelation is we have a constant expr to avoid
		// infinite recursive loop
		(isa<ConstantExpr>(C1) \|\| isa<ConstantExpr>(C2))) {
int Result = -1; // -1 = unknown, 0 = known false, 1 = known true.		int Result = -1; // -1 = unknown, 0 = known false, 1 = known true.
switch (evaluateFCmpRelation(C1, C2)) {		switch (evaluateFCmpRelation(C1, C2)) {
default: llvm_unreachable("Unknown relation!");		default: llvm_unreachable("Unknown relation!");
case FCmpInst::FCMP_UNO:		case FCmpInst::FCMP_UNO:
case FCmpInst::FCMP_ORD:		case FCmpInst::FCMP_ORD:
case FCmpInst::FCMP_UEQ:		case FCmpInst::FCMP_UEQ:
case FCmpInst::FCMP_UNE:		case FCmpInst::FCMP_UNE:
case FCmpInst::FCMP_ULT:		case FCmpInst::FCMP_ULT:
▲ Show 20 Lines • Show All 427 Lines • Show Last 20 Lines

test/Transforms/InstCombine/fcmp.ll

	Show First 20 Lines • Show All 234 Lines • ▼ Show 20 Lines

	; Don't crash.			; Don't crash.
	define i32 @test17(double %a, double (double)* %p) nounwind {			define i32 @test17(double %a, double (double)* %p) nounwind {
	%call = tail call double %p(double %a) nounwind			%call = tail call double %p(double %a) nounwind
	%cmp = fcmp ueq double %call, 0.000000e+00			%cmp = fcmp ueq double %call, 0.000000e+00
	%conv = zext i1 %cmp to i32			%conv = zext i1 %cmp to i32
	ret i32 %conv			ret i32 %conv
	}			}

				; Can fold fcmp with undef on one side by choosing NaN for the undef
				define i32 @test18_undef_unordered(float %a) nounwind {
				; CHECK-LABEL: @test18_undef_unordered
				; CHECK: ret i32 1
				%cmp = fcmp ueq float %a, undef
				%conv = zext i1 %cmp to i32
				ret i32 %conv
				}
				; Can fold fcmp with undef on one side by choosing NaN for the undef
				define i32 @test18_undef_ordered(float %a) nounwind {
				; CHECK-LABEL: @test18_undef_ordered
				; CHECK: ret i32 0
				%cmp = fcmp oeq float %a, undef
				%conv = zext i1 %cmp to i32
				ret i32 %conv
				}

				; Can fold fcmp with undef on both side
				; fcmp u_pred undef, undef -> true
				; fcmp o_pred undef, undef -> false
				; because whatever you choose for the first undef
				; you can choose NaN for the other undef
				define i1 @test19_undef_unordered() nounwind {
				; CHECK-LABEL: @test19_undef
				; CHECK: ret i1 true
				%cmp = fcmp ueq float undef, undef
				ret i1 %cmp
				}
				define i1 @test19_undef_ordered() nounwind {
				; CHECK-LABEL: @test19_undef
				; CHECK: ret i1 false
				%cmp = fcmp oeq float undef, undef
				ret i1 %cmp
				}