This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/
-
lib/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
-
InstCombineAddSub.cpp
-
InstCombineInternal.h
-
test/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
3/3
sub-gep.ll

Differential D72048

[InstCombine] Preserve nuw on sub of geps (PR44419)
ClosedPublic

Authored by nikic on Jan 1 2020, 2:19 AM.

Download Raw Diff

Details

Reviewers

spatel
lebedev.ri
RKSimon
reames
nlopes

Commits

rG0e322c8a1f20: [InstCombine] Preserve nuw on sub of geps (PR44419)

Summary

Fix https://bugs.llvm.org/show_bug.cgi?id=44419 by preserving the nuw on sub of geps. We only do this for the simple case where we have one non-swapped gep. We could also preserve some information for the two gep case, but this would be more complicated.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

nikic created this revision.Jan 1 2020, 2:19 AM

Herald added a project: Restricted Project. · View Herald TranscriptJan 1 2020, 2:19 AM

Herald added subscribers: llvm-commits, hiraditya. · View Herald Transcript

Thank you for looking into this.

llvm/test/Transforms/InstCombine/sub-gep.ll

30–41

----------------------------------------
define i64 @test_nuw(* %base, i64 %idx) {
%0:
  %p1 = gep * %base, 0 x i64 0, 4 x i64 0
  %p2 = gep * %base, 0 x i64 0, 4 x i64 %idx
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_nuw(* %base, i64 %idx) {
%0:
  %P2_IDX = shl nuw i64 %idx, 2
  ret i64 %P2_IDX
}
Transformation doesn't verify!
ERROR: Target is more poisonous than source

Example:
* %base = null
i64 %idx = undef

Source:
* %p1 = null
* %p2 = null    [based on undef value]
i64 %i1 = #x0000000000000000 (0)
i64 %i2 = #x0000000000000000 (0)
i64 %d = #x0000000000000000 (0)

Target:
i64 %P2_IDX = poison
Source value: #x0000000000000000 (0)
Target value: poison

Summary:
  0 correct transformations
  1 incorrect transformations
  0 errors

This revision now requires changes to proceed.Jan 1 2020, 2:36 AM

Only add nuw if the gep is also inbounds.

nikic marked 2 inline comments as done.Jan 1 2020, 3:11 AM

nikic added inline comments.

llvm/test/Transforms/InstCombine/sub-gep.ll
30–41	Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top bit set, then %p1 and %p2 will both be zero and the original sub is nuw, but shifting the %idx is not nuw.

I think this is still not quite right for the case where there are multiple GEP indexes. For example:

define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {
; CHECK-LABEL: @test_inbounds_nuw_multi_index(
; CHECK-NEXT:    [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 3
; CHECK-NEXT:    [[P2_IDX1:%.*]] = shl nuw nsw i64 [[IDX2:%.*]], 2
; CHECK-NEXT:    [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]
; CHECK-NEXT:    ret i64 [[P2_OFFS2]]
;
  %p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0
  %p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2
  %i1 = ptrtoint i32* %p1 to i64
  %i2 = ptrtoint i32* %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}

Let's say %idx=-1, %idx2=4, then the overall result is 8 * %idx + 4 * %idx2 = 8, which is positive, even though one of the intermediate indexes is negative and as such can't use shl nuw. I think in this case the nuw can't be on any of the instructions (including also not the add). Right?

In D72048#1800331, @nikic wrote:
I think this is still not quite right for the case where there are multiple GEP indexes. For example:
define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {
; CHECK-LABEL: @test_inbounds_nuw_multi_index(
; CHECK-NEXT:    [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 3
; CHECK-NEXT:    [[P2_IDX1:%.*]] = shl nuw nsw i64 [[IDX2:%.*]], 2
; CHECK-NEXT:    [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]
; CHECK-NEXT:    ret i64 [[P2_OFFS2]]
;
  %p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0
  %p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2
  %i1 = ptrtoint i32* %p1 to i64
  %i2 = ptrtoint i32* %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
Let's say %idx=-1, %idx2=4, then the overall result is 8 * %idx + 4 * %idx2 = 8, which is positive, even though one of the intermediate indexes is negative and as such can't use shl nuw. I think in this case the nuw can't be on any of the instructions (including also not the add). Right?

Sure.

----------------------------------------
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %p1 = gep inbounds * %base, 0 x i64 0, 8 x i64 0, 4 x i64 0
  %p2 = gep inbounds * %base, 0 x i64 0, 8 x i64 %idx, 4 x i64 %idx2
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %P2_IDX = shl nsw nuw i64 %idx, 3
  %P2_IDX1 = shl nsw nuw i64 %idx2, 2
  %P2_OFFS2 = add i64 %P2_IDX, %P2_IDX1
  ret i64 %P2_OFFS2
}
Transformation doesn't verify!
ERROR: Target is more poisonous than source

Example:
* %base = pointer(non-local, block_id=1, offset=498773658766409739)
i64 %idx = #x0322800007800000 (225883668936130560)
i64 %idx2 = #xfa00000000000000 (18014398509481984000, -432345564227567616)

Source:
* %p1 = pointer(non-local, block_id=1, offset=498773658766409739)
* %p2 = pointer(non-local, block_id=1, offset=576460753345183755)
i64 %i1 = #x171bffffc3ffffff (1665205961213607935)
i64 %i2 = #x182fffffffffffff (1742893055792381951)
i64 %d = #x011400003c000000 (77687094578774016)

Target:
i64 %P2_IDX = #x191400003c000000 (1807069351489044480)
i64 %P2_IDX1 = poison
i64 %P2_OFFS2 = poison
Source value: #x011400003c000000 (77687094578774016)
Target value: poison

Summary:
  0 correct transformations
  1 incorrect transformations
  0 errors

----------------------------------------
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %p1 = gep inbounds * %base, 0 x i64 0, 8 x i64 0, 4 x i64 0
  %p2 = gep inbounds * %base, 0 x i64 0, 8 x i64 %idx, 4 x i64 %idx2
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %P2_IDX = shl nsw i64 %idx, 3
  %P2_IDX1 = shl nsw i64 %idx2, 2
  %P2_OFFS2 = add i64 %P2_IDX, %P2_IDX1
  ret i64 %P2_OFFS2
}
Transformation seems to be correct!

Summary:
  1 correct transformations
  0 incorrect transformations
  0 errors

alex added a subscriber: alex.Jan 1 2020, 5:40 AM

Fun fact: If you change https://github.com/llvm/llvm-project/blob/773667b8c20d35c18334f8c7663df8ceacfdd2e5/llvm/include/llvm/Analysis/Utils/Local.h#L92 to not emit a useless add 0, %x you get a regression in https://github.com/llvm/llvm-project/blob/773667b8c20d35c18334f8c7663df8ceacfdd2e5/llvm/test/Transforms/InstCombine/icmp.ll#L513-L524, because IRBuilder instructions get inserted into the InstCombine worklist in the wrong order :(

Only add nuw to final mul.

As the scope of this optimization turned out to be a lot smaller than I originally expected, I've moved this as a fixup operation in OptimizePointerDifference(), instead of directly emitting the nuw flag in EmitGEPOffset(), which is somewhat tricky to do.

The code is slightly odd due to the need to match the zero add, which I wasn't able to simply drop for the reason mentioned above.

RKSimon added reviewers: reames, nlopes.Jan 2 2020, 10:45 AM

Ping

Not really familiar with this code.
This seems correct to me, but maybe I'm missing some subtlety.

llvm/test/Transforms/InstCombine/sub-gep.ll
88	Precommit this?

This revision is now accepted and ready to land.Jan 8 2020, 2:54 PM

Closed by commit rG0e322c8a1f20: [InstCombine] Preserve nuw on sub of geps (PR44419) (authored by nikic). · Explain WhyJan 11 2020, 2:04 AM

This revision was automatically updated to reflect the committed changes.

nikic marked an inline comment as done.

Revision Contents

Path

Size

llvm/

lib/

Transforms/

InstCombine/

InstCombineAddSub.cpp

17 lines

InstCombineInternal.h

3 lines

test/

Transforms/

InstCombine/

sub-gep.ll

2 lines

Diff 237488

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

Show First 20 Lines • Show All 1,579 Lines • ▼ Show 20 Lines	Instruction *InstCombiner::visitFAdd(BinaryOperator &I) {

return nullptr;		return nullptr;
}		}

/// Optimize pointer differences into the same array into a size. Consider:		/// Optimize pointer differences into the same array into a size. Consider:
/// &A[10] - &A[0]: we should compile this to "10". LHS/RHS are the pointer		/// &A[10] - &A[0]: we should compile this to "10". LHS/RHS are the pointer
/// operands to the ptrtoint instructions for the LHS/RHS of the subtract.		/// operands to the ptrtoint instructions for the LHS/RHS of the subtract.
Value *InstCombiner::OptimizePointerDifference(Value *LHS, Value *RHS,		Value *InstCombiner::OptimizePointerDifference(Value *LHS, Value *RHS,
Type *Ty) {		Type *Ty, bool IsNUW) {
// If LHS is a gep based on RHS or RHS is a gep based on LHS, we can optimize		// If LHS is a gep based on RHS or RHS is a gep based on LHS, we can optimize
// this.		// this.
bool Swapped = false;		bool Swapped = false;
GEPOperator *GEP1 = nullptr, *GEP2 = nullptr;		GEPOperator *GEP1 = nullptr, *GEP2 = nullptr;

// For now we require one side to be the base pointer "A" or a constant		// For now we require one side to be the base pointer "A" or a constant
// GEP derived from it.		// GEP derived from it.
if (GEPOperator *LHSGEP = dyn_cast<GEPOperator>(LHS)) {		if (GEPOperator *LHSGEP = dyn_cast<GEPOperator>(LHS)) {
▲ Show 20 Lines • Show All 51 Lines • ▼ Show 20 Lines	if (NumNonConstantIndices1 + NumNonConstantIndices2 > 1 &&
(NumNonConstantIndices2 > 0 && !GEP2->hasOneUse()))) {		(NumNonConstantIndices2 > 0 && !GEP2->hasOneUse()))) {
return nullptr;		return nullptr;
}		}
}		}

// Emit the offset of the GEP and an intptr_t.		// Emit the offset of the GEP and an intptr_t.
Value *Result = EmitGEPOffset(GEP1);		Value *Result = EmitGEPOffset(GEP1);

		// If this is a single inbounds GEP and the original sub was nuw,
		// then the final multiplication is also nuw. We match an extra add zero
		// here, because that's what EmitGEPOffset() generates.
		Instruction *I;
		if (IsNUW && !GEP2 && !Swapped && GEP1->isInBounds() &&
		match(Result, m_Add(m_Instruction(I), m_Zero())) &&
		I->getOpcode() == Instruction::Mul)
		I->setHasNoUnsignedWrap();

// If we had a constant expression GEP on the other side offsetting the		// If we had a constant expression GEP on the other side offsetting the
// pointer, subtract it from the offset we have.		// pointer, subtract it from the offset we have.
if (GEP2) {		if (GEP2) {
Value *Offset = EmitGEPOffset(GEP2);		Value *Offset = EmitGEPOffset(GEP2);
Result = Builder.CreateSub(Result, Offset);		Result = Builder.CreateSub(Result, Offset);
}		}

// If we have p - gep(p, ...) then we have to negate the result.		// If we have p - gep(p, ...) then we have to negate the result.
▲ Show 20 Lines • Show All 382 Lines • ▼ Show 20 Lines	if (Op1->hasOneUse()) {
}		}
}		}

// Optimize pointer differences into the same array into a size. Consider:		// Optimize pointer differences into the same array into a size. Consider:
// &A[10] - &A[0]: we should compile this to "10".		// &A[10] - &A[0]: we should compile this to "10".
Value *LHSOp, *RHSOp;		Value *LHSOp, *RHSOp;
if (match(Op0, m_PtrToInt(m_Value(LHSOp))) &&		if (match(Op0, m_PtrToInt(m_Value(LHSOp))) &&
match(Op1, m_PtrToInt(m_Value(RHSOp))))		match(Op1, m_PtrToInt(m_Value(RHSOp))))
if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))		if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType(),
		I.hasNoUnsignedWrap()))
return replaceInstUsesWith(I, Res);		return replaceInstUsesWith(I, Res);

// trunc(p)-trunc(q) -> trunc(p-q)		// trunc(p)-trunc(q) -> trunc(p-q)
if (match(Op0, m_Trunc(m_PtrToInt(m_Value(LHSOp)))) &&		if (match(Op0, m_Trunc(m_PtrToInt(m_Value(LHSOp)))) &&
match(Op1, m_Trunc(m_PtrToInt(m_Value(RHSOp)))))		match(Op1, m_Trunc(m_PtrToInt(m_Value(RHSOp)))))
if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))		if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType(),
		/* IsNUW */ false))
return replaceInstUsesWith(I, Res);		return replaceInstUsesWith(I, Res);

// Canonicalize a shifty way to code absolute value to the common pattern.		// Canonicalize a shifty way to code absolute value to the common pattern.
// There are 2 potential commuted variants.		// There are 2 potential commuted variants.
// We're relying on the fact that we only do this transform when the shift has		// We're relying on the fact that we only do this transform when the shift has
// exactly 2 uses and the xor has exactly 1 use (otherwise, we might increase		// exactly 2 uses and the xor has exactly 1 use (otherwise, we might increase
// instructions).		// instructions).
Value *A;		Value *A;
▲ Show 20 Lines • Show All 212 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

Show First 20 Lines • Show All 363 Lines • ▼ Show 20 Lines	public:
// Return Value:		// Return Value:
// null - No change was made		// null - No change was made
// I - Change was made, I is still valid, I may be dead though		// I - Change was made, I is still valid, I may be dead though
// otherwise - Change was made, replace I with returned instruction		// otherwise - Change was made, replace I with returned instruction
//		//
Instruction *visitFNeg(UnaryOperator &I);		Instruction *visitFNeg(UnaryOperator &I);
Instruction *visitAdd(BinaryOperator &I);		Instruction *visitAdd(BinaryOperator &I);
Instruction *visitFAdd(BinaryOperator &I);		Instruction *visitFAdd(BinaryOperator &I);
Value *OptimizePointerDifference(Value *LHS, Value *RHS, Type *Ty);		Value *OptimizePointerDifference(
		Value *LHS, Value *RHS, Type *Ty, bool isNUW);
Instruction *visitSub(BinaryOperator &I);		Instruction *visitSub(BinaryOperator &I);
Instruction *visitFSub(BinaryOperator &I);		Instruction *visitFSub(BinaryOperator &I);
Instruction *visitMul(BinaryOperator &I);		Instruction *visitMul(BinaryOperator &I);
Instruction *visitFMul(BinaryOperator &I);		Instruction *visitFMul(BinaryOperator &I);
Instruction *visitURem(BinaryOperator &I);		Instruction *visitURem(BinaryOperator &I);
Instruction *visitSRem(BinaryOperator &I);		Instruction *visitSRem(BinaryOperator &I);
Instruction *visitFRem(BinaryOperator &I);		Instruction *visitFRem(BinaryOperator &I);
bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I);		bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I);
▲ Show 20 Lines • Show All 627 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/sub-gep.ll

Show All 10 Lines	;
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub i64 %i2, %i1		%d = sub i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

define i64 @test_inbounds_nuw([0 x i32]* %base, i64 %idx) {		define i64 @test_inbounds_nuw([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_inbounds_nuw(		; CHECK-LABEL: @test_inbounds_nuw(
; CHECK-NEXT: [[P2_IDX:%.*]] = shl nsw i64 [[IDX:%.*]], 2		; CHECK-NEXT: [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 2
; CHECK-NEXT: ret i64 [[P2_IDX]]		; CHECK-NEXT: ret i64 [[P2_IDX]]
;		;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0
%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

define i64 @test_nuw([0 x i32]* %base, i64 %idx) {		define i64 @test_nuw([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_nuw(		; CHECK-LABEL: @test_nuw(
; CHECK-NEXT: [[P2_IDX:%.*]] = shl i64 [[IDX:%.*]], 2		; CHECK-NEXT: [[P2_IDX:%.*]] = shl i64 [[IDX:%.*]], 2
; CHECK-NEXT: ret i64 [[P2_IDX]]		; CHECK-NEXT: ret i64 [[P2_IDX]]
;		;
%p1 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 0
%p2 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p2 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}
		lebedev.riUnsubmitted Done Reply Inline Actions ---------------------------------------- define i64 @test_nuw(* %base, i64 %idx) { %0: %p1 = gep * %base, 0 x i64 0, 4 x i64 0 %p2 = gep * %base, 0 x i64 0, 4 x i64 %idx %i1 = ptrtoint * %p1 to i64 %i2 = ptrtoint * %p2 to i64 %d = sub nuw i64 %i2, %i1 ret i64 %d } => define i64 @test_nuw(* %base, i64 %idx) { %0: %P2_IDX = shl nuw i64 %idx, 2 ret i64 %P2_IDX } Transformation doesn't verify! ERROR: Target is more poisonous than source Example: * %base = null i64 %idx = undef Source: * %p1 = null * %p2 = null [based on undef value] i64 %i1 = #x0000000000000000 (0) i64 %i2 = #x0000000000000000 (0) i64 %d = #x0000000000000000 (0) Target: i64 %P2_IDX = poison Source value: #x0000000000000000 (0) Target value: poison Summary: 0 correct transformations 1 incorrect transformations 0 errors lebedev.ri: ``` ---------------------------------------- define i64 @test_nuw(* %base, i64 %idx) { %0…
		nikicAuthorUnsubmitted Done Reply Inline Actions Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top bit set, then %p1 and %p2 will both be zero and the original sub is nuw, but shifting the %idx is not nuw. nikic: Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top…

define i32 @test_inbounds_nuw_trunc([0 x i32]* %base, i64 %idx) {		define i32 @test_inbounds_nuw_trunc([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_inbounds_nuw_trunc(		; CHECK-LABEL: @test_inbounds_nuw_trunc(
; CHECK-NEXT: [[IDX_TR:%.*]] = trunc i64 [[IDX:%.*]] to i32		; CHECK-NEXT: [[IDX_TR:%.*]] = trunc i64 [[IDX:%.*]] to i32
; CHECK-NEXT: [[TMP1:%.*]] = shl i32 [[IDX_TR]], 2		; CHECK-NEXT: [[TMP1:%.*]] = shl i32 [[IDX_TR]], 2
; CHECK-NEXT: ret i32 [[TMP1]]		; CHECK-NEXT: ret i32 [[TMP1]]
;		;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0
Show All 30 Lines	;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx2		%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx2
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {		define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {
		lebedev.riUnsubmitted Done Reply Inline Actions Precommit this? lebedev.ri: Precommit this?
; CHECK-LABEL: @test_inbounds_nuw_multi_index(		; CHECK-LABEL: @test_inbounds_nuw_multi_index(
; CHECK-NEXT: [[P2_IDX:%.*]] = shl nsw i64 [[IDX:%.*]], 3		; CHECK-NEXT: [[P2_IDX:%.*]] = shl nsw i64 [[IDX:%.*]], 3
; CHECK-NEXT: [[P2_IDX1:%.*]] = shl nsw i64 [[IDX2:%.*]], 2		; CHECK-NEXT: [[P2_IDX1:%.*]] = shl nsw i64 [[IDX2:%.*]], 2
; CHECK-NEXT: [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]		; CHECK-NEXT: [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]
; CHECK-NEXT: ret i64 [[P2_OFFS2]]		; CHECK-NEXT: ret i64 [[P2_OFFS2]]
;		;
%p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0		%p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0
%p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2		%p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Preserve nuw on sub of geps (PR44419)ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 237488

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

llvm/test/Transforms/InstCombine/sub-gep.ll

[InstCombine] Preserve nuw on sub of geps (PR44419)
ClosedPublic