This is an archive of the discontinued LLVM Phabricator instance.

----------------------------------------
Optimization: zz
Precondition: ((C != 1) && (C != -128))
  %div = sdiv exact i8 %x, C
  %r = sub i8 0, %div
=>
  %r = sdiv exact i8 %x, -C

Done: 1
Optimization is correct!

llvm/test/Transforms/InstCombine/div.ll
762–763	Please add more tests: a variant with nsw but without exact; a variant without nsw but with exact; a variant without nsw and without exact; ??? Also, are there tests with C = 1 and C = MinSigned?

address comments

please precommit the tests

llvm/test/Transforms/InstCombine/div.ll
783	tests are faulty, contain `nsw` despite the name

address Roman's comments.

Thanks for your comments Roman @lebedev.ri . Updated.

llvm/test/Transforms/InstCombine/div.ll
783	oops. fixed.

llvm/test/Transforms/InstCombine/div.ll
809	test name is `@test_exact_nonsw_noexact`

This revision is now accepted and ready to land. · Apr 8 2019, 3:34 AM

Closed by commit rL357904: [InstCombine] sdiv exact flag fixup. (authored by shchenz). · Explain Why · Apr 8 2019, 5:06 AM

This revision was automatically updated to reflect the committed changes.

shchenz marked an inline comment as done.

lebedev.ri added inline comments. · Apr 8 2019, 5:22 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Uhm. So, this is not related to this patch specifically, but I think the `isOneValue()` check is incorrect and may be causing miscompiles: https://godbolt.org/z/CmAslh <- I don't think `@test_exact_vec` should be folded? I think you want to add an `isNotOneValue()`. Also, is this fold valid for `undef` elements? CC @spatel

spatel added inline comments. · Apr 8 2019, 6:00 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Yes, if this patch has not been reverted yet, it probably should be. It's not correct for arbitrary vector constants. We can either limit this to splat constants (m_APInt) or do the more involved element-by-element check. If the divisor has an undef element, we have immediate UB, so anything goes. But we might want to do something better? I haven't looked at this patch closely yet.

lebedev.ri added inline comments. · Apr 8 2019, 6:24 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Note that this patch only fixed propagation of `exact`. I'm wondering if the entire fold is broken for vectors w/`undef` elts.

lebedev.ri added inline comments. · Apr 8 2019, 6:26 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	... and it won't be possible to revert the original patch, since it has been in the tree for 9+ years. So I think this fold should be fixed instead.

nikic added a subscriber: nikic. · Apr 8 2019, 6:33 AM

spatel added inline comments. · Apr 8 2019, 6:34 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Ah, sorry - didn't see it clearly the 1st time. Yes, I agree the bug was already there, so we just need to fix it as a follow-up. Do you or @shchenz want to write that patch?

lebedev.ri added inline comments. · Apr 8 2019, 6:36 AM

llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Filed https://bugs.llvm.org/show_bug.cgi?id=41425

shchenz marked an inline comment as done. · Apr 8 2019, 6:42 AM

shchenz added inline comments.

llvm/test/Transforms/InstCombine/div.ll
809	fixed.
llvm/trunk/lib/Transforms/InstCombine/InstCombineAddSub.cpp
1696 ↗	(On Diff #194116)	Thanks for pointing out this bug. I am afraid I don't have time to work on this issue right now.

Revision Contents

Path

Size

llvm/

lib/

Transforms/

InstCombine/

InstCombineAddSub.cpp

7 lines

test/

Transforms/

InstCombine/

div.ll

6 lines

Diff 194107

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

Show First 20 Lines • Show All 1,687 Lines • ▼ Show 20 Lines	if (Op1->hasOneUse()) {

// (X - (X & Y)) --> (X & ~Y)		// (X - (X & Y)) --> (X & ~Y)
if (match(Op1, m_c_And(m_Value(Y), m_Specific(Op0))))		if (match(Op1, m_c_And(m_Value(Y), m_Specific(Op0))))
return BinaryOperator::CreateAnd(Op0,		return BinaryOperator::CreateAnd(Op0,
Builder.CreateNot(Y, Y->getName() + ".not"));		Builder.CreateNot(Y, Y->getName() + ".not"));

// 0 - (X sdiv C) -> (X sdiv -C) provided the negation doesn't overflow.		// 0 - (X sdiv C) -> (X sdiv -C) provided the negation doesn't overflow.
if (match(Op1, m_SDiv(m_Value(X), m_Constant(C))) && match(Op0, m_Zero()) &&		if (match(Op1, m_SDiv(m_Value(X), m_Constant(C))) && match(Op0, m_Zero()) &&
C->isNotMinSignedValue() && !C->isOneValue())		C->isNotMinSignedValue() && !C->isOneValue()) {
return BinaryOperator::CreateSDiv(X, ConstantExpr::getNeg(C));		auto *BO = BinaryOperator::CreateSDiv(X, ConstantExpr::getNeg(C));
		BO->setIsExact(cast<BinaryOperator>(Op1)->isExact());
		return BO;
		}

// 0 - (X << Y) -> (-X << Y) when X is freely negatable.		// 0 - (X << Y) -> (-X << Y) when X is freely negatable.
if (match(Op1, m_Shl(m_Value(X), m_Value(Y))) && match(Op0, m_Zero()))		if (match(Op1, m_Shl(m_Value(X), m_Value(Y))) && match(Op0, m_Zero()))
if (Value *XNeg = dyn_castNegVal(X))		if (Value *XNeg = dyn_castNegVal(X))
return BinaryOperator::CreateShl(XNeg, Y);		return BinaryOperator::CreateShl(XNeg, Y);

// Subtracting -1/0 is the same as adding 1/0:		// Subtracting -1/0 is the same as adding 1/0:
// sub [nsw] Op0, sext(bool Y) -> add [nsw] Op0, zext(bool Y)		// sub [nsw] Op0, sext(bool Y) -> add [nsw] Op0, zext(bool Y)
▲ Show 20 Lines • Show All 214 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/div.ll

	Show First 20 Lines • Show All 753 Lines • ▼ Show 20 Lines
	; CHECK-NEXT: [[C:%.*]] = udiv <2 x i8> [[A]], [[B]]			; CHECK-NEXT: [[C:%.*]] = udiv <2 x i8> [[A]], [[B]]
	; CHECK-NEXT: ret <2 x i8> [[C]]			; CHECK-NEXT: ret <2 x i8> [[C]]
	;			;
	%a = mul nuw <2 x i8> %z, %x			%a = mul nuw <2 x i8> %z, %x
	%b = mul <2 x i8> %z, %y			%b = mul <2 x i8> %z, %y
	%c = udiv <2 x i8> %a, %b			%c = udiv <2 x i8> %a, %b
	ret <2 x i8> %c			ret <2 x i8> %c
	}			}

	define i32 @test_exact_nsw_exact(i32 %x) {			define i32 @test_exact_nsw_exact(i32 %x) {
				lebedev.riUnsubmitted Not Done Reply Inline Actions Please add more tests. Variant with nsw, but without exact Variant without nsw, but with exact Variant without nsw, and without exact ??? Are there tests with C = 1, C = MinSigned ? lebedev.ri: Please add more tests. * Variant with nsw, but without exact * Variant without nsw, but with…
	; CHECK-LABEL: @test_exact_nsw_exact(			; CHECK-LABEL: @test_exact_nsw_exact(
	; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3			; CHECK-NEXT: [[NEG:%.*]] = sdiv exact i32 [[X:%.*]], -3
	; CHECK-NEXT: ret i32 [[NEG]]			; CHECK-NEXT: ret i32 [[NEG]]
	;			;
	%div = sdiv exact i32 %x, 3			%div = sdiv exact i32 %x, 3
	%neg = sub nsw i32 0, %div			%neg = sub nsw i32 0, %div
	ret i32 %neg			ret i32 %neg
	}			}

	define <2 x i64> @test_exact_vec(<2 x i64> %x) {			define <2 x i64> @test_exact_vec(<2 x i64> %x) {
	; CHECK-LABEL: @test_exact_vec(			; CHECK-LABEL: @test_exact_vec(
	; CHECK-NEXT: [[NEG:%.*]] = sdiv <2 x i64> [[X:%.*]], <i64 -3, i64 -4>			; CHECK-NEXT: [[NEG:%.*]] = sdiv exact <2 x i64> [[X:%.*]], <i64 -3, i64 -4>
	; CHECK-NEXT: ret <2 x i64> [[NEG]]			; CHECK-NEXT: ret <2 x i64> [[NEG]]
	;			;
	%div = sdiv exact <2 x i64> %x, <i64 3, i64 4>			%div = sdiv exact <2 x i64> %x, <i64 3, i64 4>
	%neg = sub nsw <2 x i64> zeroinitializer, %div			%neg = sub nsw <2 x i64> zeroinitializer, %div
	ret <2 x i64> %neg			ret <2 x i64> %neg
	}			}

	define i32 @test_exact_nonsw_exact(i32 %x) {			define i32 @test_exact_nonsw_exact(i32 %x) {
				lebedev.riUnsubmitted Not Done Reply Inline Actions tests are faulty, contain `nsw` despite the name lebedev.ri: tests are faulty, contain `nsw` despite the name
				shchenzAuthorUnsubmitted Done Reply Inline Actions oops. fixed. shchenz: oops. fixed.
	; CHECK-LABEL: @test_exact_nonsw_exact(			; CHECK-LABEL: @test_exact_nonsw_exact(
	; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3			; CHECK-NEXT: [[NEG:%.*]] = sdiv exact i32 [[X:%.*]], -3
	; CHECK-NEXT: ret i32 [[NEG]]			; CHECK-NEXT: ret i32 [[NEG]]
	;			;
	%div = sdiv exact i32 %x, 3			%div = sdiv exact i32 %x, 3
	%neg = sub i32 0, %div			%neg = sub i32 0, %div
	ret i32 %neg			ret i32 %neg
	}			}

	define i32 @test_exact_nsw_noexact(i32 %x) {			define i32 @test_exact_nsw_noexact(i32 %x) {
	; CHECK-LABEL: @test_exact_nsw_noexact(			; CHECK-LABEL: @test_exact_nsw_noexact(
	; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3			; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3
	; CHECK-NEXT: ret i32 [[NEG]]			; CHECK-NEXT: ret i32 [[NEG]]
	;			;
	%div = sdiv i32 %x, 3			%div = sdiv i32 %x, 3
	%neg = sub nsw i32 0, %div			%neg = sub nsw i32 0, %div
	ret i32 %neg			ret i32 %neg
	}			}

	define i32 @test_exact_nonsw_noexact(i32 %x) {			define i32 @test_exact_nonsw_noexact(i32 %x) {
	; CHECK-LABEL: @test_exact_nonsw_noexact(			; CHECK-LABEL: @test_exact_nonsw_noexact(
	; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3			; CHECK-NEXT: [[NEG:%.*]] = sdiv i32 [[X:%.*]], -3
	; CHECK-NEXT: ret i32 [[NEG]]			; CHECK-NEXT: ret i32 [[NEG]]
	;			;
	%div = sdiv i32 %x, 3			%div = sdiv i32 %x, 3
	%neg = sub nsw i32 0, %div			%neg = sub nsw i32 0, %div
				lebedev.riUnsubmitted Not Done Reply Inline Actions test name is `@test_exact_nonsw_noexact` lebedev.ri: test name is `@test_exact_nonsw_noexact`
				shchenzAuthorUnsubmitted Done Reply Inline Actions fixed. shchenz: fixed.
	ret i32 %neg			ret i32 %neg
	}			}

	define i32 @test_exact_div_nonconst(i32 %x, i32 %y) {			define i32 @test_exact_div_nonconst(i32 %x, i32 %y) {
	; CHECK-LABEL: @test_exact_div_nonconst(			; CHECK-LABEL: @test_exact_div_nonconst(
	; CHECK-NEXT: [[DIV:%.*]] = sdiv exact i32 [[X:%.*]], [[Y:%.*]]			; CHECK-NEXT: [[DIV:%.*]] = sdiv exact i32 [[X:%.*]], [[Y:%.*]]
	; CHECK-NEXT: [[NEG:%.*]] = sub nsw i32 0, [[DIV]]			; CHECK-NEXT: [[NEG:%.*]] = sub nsw i32 0, [[DIV]]
	; CHECK-NEXT: ret i32 [[NEG]]			; CHECK-NEXT: ret i32 [[NEG]]
	Show All 26 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] sdiv exact flag fixupClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 194107

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

llvm/test/Transforms/InstCombine/div.ll

[InstCombine] sdiv exact flag fixup
ClosedPublic