This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/trunk/
-
trunk/
-
lib/Transforms/Utils/
-
Transforms/
-
Utils/
-
SimplifyLibCalls.cpp
-
test/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
-
pow-1.ll

Differential D22104

[SimplifyLibCalls] pow(x, 0.5) -> fabs(sqrt(x)) (finite-only-mode)
AbandonedPublic

Authored by davide on Jul 7 2016, 11:48 AM.

Download Raw Diff

Details

Reviewers

spatel
majnemer
scanon

Commits

rG27da131f327b: [SLC] Emit an intrinsic instead of a libcall for pow.
rL277963: [SLC] Emit an intrinsic instead of a libcall for pow.

Summary

This is a new version of http://reviews.llvm.org/D16833 as mgrang has no more time to work on the feature.
This patch differs substantially from the previous version. The original patch applied the transformation if:
if (Op1C->getValueAPF().isFinite())

I don't think this is the correct way of checking that we're in finite-only mode. Instead, I check that the function has the attributes no-nans-fp-math and no-infs-fp-math both set to true. I hope I wasn't entirely wrong in my analysis. In any case, comments are welcome.

Also, this adds a test (which wasn't included in the original revision).

cc:ing Steve Canon so that he can confirm/deny if this makes sense from a mathematical point of view.

Diff Detail

Repository: rL LLVM

Event Timeline

davide updated this revision to Diff 63107. Jul 7 2016, 11:48 AM

davide retitled this revision from to [SimplifyLibCalls] pow(x, 0.5) -> fabs(sqrt(x)) (finite-only-mode).

davide updated this object.

davide added reviewers: majnemer, spatel, scanon.

davide added a subscriber: llvm-commits.

majnemer added inline comments. Jul 7 2016, 11:55 AM

lib/Transforms/Utils/SimplifyLibCalls.cpp
1071 ↗	(On Diff #63107)	Hmm. Why not check to see if the call-site is annotated with `ninf nnan`?

Like this, or did you mean something different?

ping

Also, maybe we can do this separately, but after discussing with Sanjay I concluded that maybe it's a good idea to emit intrinsics instead of libcalls here as optimizeSqrt() does? David, what do you think?

This doesn't preserve FMF across calls; it needs to be modified to take that into account (thanks to Sanjay for the suggestion offline).

Sorry - didn't mean to back-channel a review. I just noticed that the test case starts with an LLVM intrinsic and ends with libcalls. That means we've artificially (if it's ok for scalars, then it's ok for vectors) excluded the vector variant of an 'llvm.pow' from this transform. There was also a proposal to change all libcalls to intrinsics when possible, so I think we're just creating extra work for that pass if we create libcalls here.

Possible changes to make this transform more general:

Switch the dyn_cast check for ConstantFP to "match(X, m_SpecificFP(0.5))" (this should work with a vector splat constant).
Use llvm.fabs/sqrt intrinsics so the transform works with vectors.
Check the 'nsz' FMF too; ie, for the case that James and Eli noted, 'nsz' should let us eliminate the fabs.

Closed by commit rL277963: [SLC] Emit an intrinsic instead of a libcall for pow. (authored by davide). · Explain Why · Aug 7 2016, 1:35 PM

This revision was automatically updated to reflect the committed changes.

davide reopened this revision. Aug 7 2016, 1:37 PM

It's not obvious this transformation buys something, abandoning for now.

Revision Contents

Path

Size

llvm/

trunk/

lib/

Transforms/

Utils/

SimplifyLibCalls.cpp

22 lines

test/

Transforms/

InstCombine/

pow-1.ll

6 lines

Diff 67103

llvm/trunk/lib/Transforms/Utils/SimplifyLibCalls.cpp

	Show First 20 Lines • Show All 987 Lines • ▼ Show 20 Lines
	Value LibCallSimplifier::optimizePow(CallInst CI, IRBuilder<> &B) {			Value LibCallSimplifier::optimizePow(CallInst CI, IRBuilder<> &B) {
	Function *Callee = CI->getCalledFunction();			Function *Callee = CI->getCalledFunction();
	Value *Ret = nullptr;			Value *Ret = nullptr;
	StringRef Name = Callee->getName();			StringRef Name = Callee->getName();
	if (UnsafeFPShrink && Name == "pow" && hasFloatVersion(Name))			if (UnsafeFPShrink && Name == "pow" && hasFloatVersion(Name))
	Ret = optimizeUnaryDoubleFP(CI, B, true);			Ret = optimizeUnaryDoubleFP(CI, B, true);

	Value Op1 = CI->getArgOperand(0), Op2 = CI->getArgOperand(1);			Value Op1 = CI->getArgOperand(0), Op2 = CI->getArgOperand(1);
	if (ConstantFP *Op1C = dyn_cast<ConstantFP>(Op1)) {
	// pow(1.0, x) -> 1.0			// pow(1.0, x) -> 1.0
	if (Op1C->isExactlyValue(1.0))			if (match(Op1, m_SpecificFP(1.0)))
	return Op1C;			return Op1;
	// pow(2.0, x) -> exp2(x)			// pow(2.0, x) -> llvm.exp2(x)
	if (Op1C->isExactlyValue(2.0) &&			if (match(Op1, m_SpecificFP(2.0))) {
	hasUnaryFloatFn(TLI, Op1->getType(), LibFunc::exp2, LibFunc::exp2f,			Value *Exp2 = Intrinsic::getDeclaration(CI->getModule(), Intrinsic::exp2,
	LibFunc::exp2l))			CI->getType());
	return emitUnaryFloatFnCall(Op2, TLI->getName(LibFunc::exp2), B,			return B.CreateCall(Exp2, Op2, "exp2");
	Callee->getAttributes());			}

				// There's no llvm.exp10 intrinsic yet, but, maybe, some day there will
				// be one.
				if (ConstantFP *Op1C = dyn_cast<ConstantFP>(Op1)) {
	// pow(10.0, x) -> exp10(x)			// pow(10.0, x) -> exp10(x)
	if (Op1C->isExactlyValue(10.0) &&			if (Op1C->isExactlyValue(10.0) &&
	hasUnaryFloatFn(TLI, Op1->getType(), LibFunc::exp10, LibFunc::exp10f,			hasUnaryFloatFn(TLI, Op1->getType(), LibFunc::exp10, LibFunc::exp10f,
	LibFunc::exp10l))			LibFunc::exp10l))
	return emitUnaryFloatFnCall(Op2, TLI->getName(LibFunc::exp10), B,			return emitUnaryFloatFnCall(Op2, TLI->getName(LibFunc::exp10), B,
	Callee->getAttributes());			Callee->getAttributes());
	}			}

	▲ Show 20 Lines • Show All 1,336 Lines • Show Last 20 Lines

llvm/trunk/test/Transforms/InstCombine/pow-1.ll

	Show All 31 Lines
	; CHECK-NEXT: ret double 1.000000e+00			; CHECK-NEXT: ret double 1.000000e+00
	}			}

	; Check pow(2.0, x) -> exp2(x).			; Check pow(2.0, x) -> exp2(x).

	define float @test_simplify3(float %x) {			define float @test_simplify3(float %x) {
	; CHECK-LABEL: @test_simplify3(			; CHECK-LABEL: @test_simplify3(
	%retval = call float @powf(float 2.0, float %x)			%retval = call float @powf(float 2.0, float %x)
	; CHECK-NEXT: [[EXP2F:%[a-z0-9]+]] = call float @exp2f(float %x) [[NUW_RO:#[0-9]+]]			; CHECK-NEXT: [[EXP2F:%[a-z0-9]+]] = call float @llvm.exp2.f32(float %x)
	ret float %retval			ret float %retval
	; CHECK-NEXT: ret float [[EXP2F]]			; CHECK-NEXT: ret float [[EXP2F]]
	}			}

	define double @test_simplify4(double %x) {			define double @test_simplify4(double %x) {
	; CHECK-LABEL: @test_simplify4(			; CHECK-LABEL: @test_simplify4(
	%retval = call double @pow(double 2.0, double %x)			%retval = call double @pow(double 2.0, double %x)
	; CHECK-NEXT: [[EXP2:%[a-z0-9]+]] = call double @exp2(double %x) [[NUW_RO]]			; CHECK-NEXT: [[EXP2:%[a-z0-9]+]] = call double @llvm.exp2.f64(double %x)
	ret double %retval			ret double %retval
	; CHECK-NEXT: ret double [[EXP2]]			; CHECK-NEXT: ret double [[EXP2]]
	}			}

	; Check pow(x, 0.0) -> 1.0.			; Check pow(x, 0.0) -> 1.0.

	define float @test_simplify5(float %x) {			define float @test_simplify5(float %x) {
	; CHECK-LABEL: @test_simplify5(			; CHECK-LABEL: @test_simplify5(
	Show All 9 Lines
	; CHECK-NEXT: ret double 1.000000e+00			; CHECK-NEXT: ret double 1.000000e+00
	}			}

	; Check pow(x, 0.5) -> fabs(sqrt(x)), where x != -infinity.			; Check pow(x, 0.5) -> fabs(sqrt(x)), where x != -infinity.

	define float @test_simplify7(float %x) {			define float @test_simplify7(float %x) {
	; CHECK-LABEL: @test_simplify7(			; CHECK-LABEL: @test_simplify7(
	%retval = call float @powf(float %x, float 0.5)			%retval = call float @powf(float %x, float 0.5)
	; CHECK-NEXT: [[SQRTF:%[a-z0-9]+]] = call float @sqrtf(float %x) [[NUW_RO]]			; CHECK-NEXT: [[SQRTF:%[a-z0-9]+]] = call float @sqrtf(float %x) [[NUW_RO:#[0-9]+]]
	; CHECK-NEXT: [[FABSF:%[a-z0-9]+]] = call float @fabsf(float [[SQRTF]]) [[NUW_RO]]			; CHECK-NEXT: [[FABSF:%[a-z0-9]+]] = call float @fabsf(float [[SQRTF]]) [[NUW_RO]]
	; CHECK-NEXT: [[FCMP:%[a-z0-9]+]] = fcmp oeq float %x, 0xFFF0000000000000			; CHECK-NEXT: [[FCMP:%[a-z0-9]+]] = fcmp oeq float %x, 0xFFF0000000000000
	; CHECK-NEXT: [[SELECT:%[a-z0-9]+]] = select i1 [[FCMP]], float 0x7FF0000000000000, float [[FABSF]]			; CHECK-NEXT: [[SELECT:%[a-z0-9]+]] = select i1 [[FCMP]], float 0x7FF0000000000000, float [[FABSF]]
	ret float %retval			ret float %retval
	; CHECK-NEXT: ret float [[SELECT]]			; CHECK-NEXT: ret float [[SELECT]]
	}			}

	define double @test_simplify8(double %x) {			define double @test_simplify8(double %x) {
	▲ Show 20 Lines • Show All 112 Lines • Show Last 20 Lines