This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/
-
include/llvm/Analysis/Utils/
-
llvm/
-
Analysis/
-
Utils/
-
Local.h
-
lib/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
-
InstCombineAddSub.cpp
-
InstCombineInternal.h
-
InstructionCombining.cpp
-
test/Transforms/InstCombine/
-
Transforms/
-
InstCombine/
3/3
sub-gep.ll

Differential D72048

[InstCombine] Preserve nuw on sub of geps (PR44419)
ClosedPublic

Authored by nikic on Jan 1 2020, 2:19 AM.

Download Raw Diff

Details

Reviewers

spatel
lebedev.ri
RKSimon
reames
nlopes

Commits

rG0e322c8a1f20: [InstCombine] Preserve nuw on sub of geps (PR44419)

Summary

Fix https://bugs.llvm.org/show_bug.cgi?id=44419 by preserving the nuw on sub of geps. We only do this for the simple case where we have one non-swapped gep. We could also preserve some information for the two gep case, but this would be more complicated.

Diff Detail

Event Timeline

nikic created this revision.Jan 1 2020, 2:19 AM

Herald added a project: Restricted Project. · View Herald TranscriptJan 1 2020, 2:19 AM

Herald added subscribers: llvm-commits, hiraditya. · View Herald Transcript

Thank you for looking into this.

llvm/test/Transforms/InstCombine/sub-gep.ll

30–41

----------------------------------------
define i64 @test_nuw(* %base, i64 %idx) {
%0:
  %p1 = gep * %base, 0 x i64 0, 4 x i64 0
  %p2 = gep * %base, 0 x i64 0, 4 x i64 %idx
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_nuw(* %base, i64 %idx) {
%0:
  %P2_IDX = shl nuw i64 %idx, 2
  ret i64 %P2_IDX
}
Transformation doesn't verify!
ERROR: Target is more poisonous than source

Example:
* %base = null
i64 %idx = undef

Source:
* %p1 = null
* %p2 = null    [based on undef value]
i64 %i1 = #x0000000000000000 (0)
i64 %i2 = #x0000000000000000 (0)
i64 %d = #x0000000000000000 (0)

Target:
i64 %P2_IDX = poison
Source value: #x0000000000000000 (0)
Target value: poison

Summary:
  0 correct transformations
  1 incorrect transformations
  0 errors

This revision now requires changes to proceed.Jan 1 2020, 2:36 AM

Only add nuw if the gep is also inbounds.

nikic marked 2 inline comments as done.Jan 1 2020, 3:11 AM

nikic added inline comments.

llvm/test/Transforms/InstCombine/sub-gep.ll
30–41	Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top bit set, then %p1 and %p2 will both be zero and the original sub is nuw, but shifting the %idx is not nuw.

I think this is still not quite right for the case where there are multiple GEP indexes. For example:

define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {
; CHECK-LABEL: @test_inbounds_nuw_multi_index(
; CHECK-NEXT:    [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 3
; CHECK-NEXT:    [[P2_IDX1:%.*]] = shl nuw nsw i64 [[IDX2:%.*]], 2
; CHECK-NEXT:    [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]
; CHECK-NEXT:    ret i64 [[P2_OFFS2]]
;
  %p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0
  %p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2
  %i1 = ptrtoint i32* %p1 to i64
  %i2 = ptrtoint i32* %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}

Let's say %idx=-1, %idx2=4, then the overall result is 8 * %idx + 4 * %idx2 = 8, which is positive, even though one of the intermediate indexes is negative and as such can't use shl nuw. I think in this case the nuw can't be on any of the instructions (including also not the add). Right?

In D72048#1800331, @nikic wrote:
I think this is still not quite right for the case where there are multiple GEP indexes. For example:
define i64 @test_inbounds_nuw_multi_index([0 x [2 x i32]]* %base, i64 %idx, i64 %idx2) {
; CHECK-LABEL: @test_inbounds_nuw_multi_index(
; CHECK-NEXT:    [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 3
; CHECK-NEXT:    [[P2_IDX1:%.*]] = shl nuw nsw i64 [[IDX2:%.*]], 2
; CHECK-NEXT:    [[P2_OFFS2:%.*]] = add i64 [[P2_IDX]], [[P2_IDX1]]
; CHECK-NEXT:    ret i64 [[P2_OFFS2]]
;
  %p1 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 0, i64 0
  %p2 = getelementptr inbounds [0 x [2 x i32]], [0 x [2 x i32]]* %base, i64 0, i64 %idx, i64 %idx2
  %i1 = ptrtoint i32* %p1 to i64
  %i2 = ptrtoint i32* %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
Let's say %idx=-1, %idx2=4, then the overall result is 8 * %idx + 4 * %idx2 = 8, which is positive, even though one of the intermediate indexes is negative and as such can't use shl nuw. I think in this case the nuw can't be on any of the instructions (including also not the add). Right?

Sure.

----------------------------------------
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %p1 = gep inbounds * %base, 0 x i64 0, 8 x i64 0, 4 x i64 0
  %p2 = gep inbounds * %base, 0 x i64 0, 8 x i64 %idx, 4 x i64 %idx2
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %P2_IDX = shl nsw nuw i64 %idx, 3
  %P2_IDX1 = shl nsw nuw i64 %idx2, 2
  %P2_OFFS2 = add i64 %P2_IDX, %P2_IDX1
  ret i64 %P2_OFFS2
}
Transformation doesn't verify!
ERROR: Target is more poisonous than source

Example:
* %base = pointer(non-local, block_id=1, offset=498773658766409739)
i64 %idx = #x0322800007800000 (225883668936130560)
i64 %idx2 = #xfa00000000000000 (18014398509481984000, -432345564227567616)

Source:
* %p1 = pointer(non-local, block_id=1, offset=498773658766409739)
* %p2 = pointer(non-local, block_id=1, offset=576460753345183755)
i64 %i1 = #x171bffffc3ffffff (1665205961213607935)
i64 %i2 = #x182fffffffffffff (1742893055792381951)
i64 %d = #x011400003c000000 (77687094578774016)

Target:
i64 %P2_IDX = #x191400003c000000 (1807069351489044480)
i64 %P2_IDX1 = poison
i64 %P2_OFFS2 = poison
Source value: #x011400003c000000 (77687094578774016)
Target value: poison

Summary:
  0 correct transformations
  1 incorrect transformations
  0 errors

----------------------------------------
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %p1 = gep inbounds * %base, 0 x i64 0, 8 x i64 0, 4 x i64 0
  %p2 = gep inbounds * %base, 0 x i64 0, 8 x i64 %idx, 4 x i64 %idx2
  %i1 = ptrtoint * %p1 to i64
  %i2 = ptrtoint * %p2 to i64
  %d = sub nuw i64 %i2, %i1
  ret i64 %d
}
=>
define i64 @test_inbounds_nuw_multi_index(* %base, i64 %idx, i64 %idx2) {
%0:
  %P2_IDX = shl nsw i64 %idx, 3
  %P2_IDX1 = shl nsw i64 %idx2, 2
  %P2_OFFS2 = add i64 %P2_IDX, %P2_IDX1
  ret i64 %P2_OFFS2
}
Transformation seems to be correct!

Summary:
  1 correct transformations
  0 incorrect transformations
  0 errors

alex added a subscriber: alex.Jan 1 2020, 5:40 AM

Fun fact: If you change https://github.com/llvm/llvm-project/blob/773667b8c20d35c18334f8c7663df8ceacfdd2e5/llvm/include/llvm/Analysis/Utils/Local.h#L92 to not emit a useless add 0, %x you get a regression in https://github.com/llvm/llvm-project/blob/773667b8c20d35c18334f8c7663df8ceacfdd2e5/llvm/test/Transforms/InstCombine/icmp.ll#L513-L524, because IRBuilder instructions get inserted into the InstCombine worklist in the wrong order :(

Only add nuw to final mul.

As the scope of this optimization turned out to be a lot smaller than I originally expected, I've reimplemented this as a fixup operation in OptimizePointerDifference(), instead of directly emitting the nuw flag in EmitGEPOffset(), which is somewhat tricky to do.

The code is slightly odd due to the need to match the zero add, which I wasn't able to simply drop for the reason mentioned above.

RKSimon added reviewers: reames, nlopes.Jan 2 2020, 10:45 AM

Ping

Not really familiar with this code.
This seems correct to me, but maybe I'm missing some subtlety.

llvm/test/Transforms/InstCombine/sub-gep.ll
88	Precommit this?

This revision is now accepted and ready to land.Jan 8 2020, 2:54 PM

Closed by commit rG0e322c8a1f20: [InstCombine] Preserve nuw on sub of geps (PR44419) (authored by nikic). · Explain WhyJan 11 2020, 2:04 AM

This revision was automatically updated to reflect the committed changes.

nikic marked an inline comment as done.

Revision Contents

Path

Size

llvm/

include/

llvm/

Analysis/

Utils/

Local.h

8 lines

lib/

Transforms/

InstCombine/

InstCombineAddSub.cpp

11 lines

InstCombineInternal.h

5 lines

InstructionCombining.cpp

5 lines

test/

Transforms/

InstCombine/

sub-gep.ll

4 lines

Diff 235749

llvm/include/llvm/Analysis/Utils/Local.h

Show All 21 Lines

/// Given a getelementptr instruction/constantexpr, emit the code necessary to		/// Given a getelementptr instruction/constantexpr, emit the code necessary to
/// compute the offset from the base pointer (without adding in the base		/// compute the offset from the base pointer (without adding in the base
/// pointer). Return the result as a signed integer of intptr size.		/// pointer). Return the result as a signed integer of intptr size.
/// When NoAssumptions is true, no assumptions about index computation not		/// When NoAssumptions is true, no assumptions about index computation not
/// overflowing is made.		/// overflowing is made.
template <typename IRBuilderTy>		template <typename IRBuilderTy>
Value EmitGEPOffset(IRBuilderTy Builder, const DataLayout &DL, User *GEP,		Value EmitGEPOffset(IRBuilderTy Builder, const DataLayout &DL, User *GEP,
bool NoAssumptions = false) {		bool NoAssumptions = false, bool IsNonNegative = false) {
GEPOperator *GEPOp = cast<GEPOperator>(GEP);		GEPOperator *GEPOp = cast<GEPOperator>(GEP);
Type *IntIdxTy = DL.getIndexType(GEP->getType());		Type *IntIdxTy = DL.getIndexType(GEP->getType());
Value *Result = Constant::getNullValue(IntIdxTy);		Value *Result = Constant::getNullValue(IntIdxTy);

// If the GEP is inbounds, we know that none of the addressing operations will		// If the GEP is inbounds, we know that none of the addressing operations will
// overflow in a signed sense.		// overflow in a signed sense.
bool isInBounds = GEPOp->isInBounds() && !NoAssumptions;		bool isInBounds = GEPOp->isInBounds() && !NoAssumptions;

Show All 23 Lines	if (Constant *OpC = dyn_cast<Constant>(Op)) {
}		}

// Splat the constant if needed.		// Splat the constant if needed.
if (IntIdxTy->isVectorTy() && !OpC->getType()->isVectorTy())		if (IntIdxTy->isVectorTy() && !OpC->getType()->isVectorTy())
OpC = ConstantVector::getSplat(IntIdxTy->getVectorNumElements(), OpC);		OpC = ConstantVector::getSplat(IntIdxTy->getVectorNumElements(), OpC);

Constant *Scale = ConstantInt::get(IntIdxTy, Size);		Constant *Scale = ConstantInt::get(IntIdxTy, Size);
Constant *OC = ConstantExpr::getIntegerCast(OpC, IntIdxTy, true /*SExt*/);		Constant *OC = ConstantExpr::getIntegerCast(OpC, IntIdxTy, true /*SExt*/);
Scale =		Scale = ConstantExpr::getMul(
ConstantExpr::getMul(OC, Scale, false /*NUW*/, isInBounds /*NSW*/);		OC, Scale, IsNonNegative /*NUW*/, isInBounds /*NSW*/);
// Emit an add instruction.		// Emit an add instruction.
Result = Builder->CreateAdd(Result, Scale, GEP->getName()+".offs");		Result = Builder->CreateAdd(Result, Scale, GEP->getName()+".offs");
continue;		continue;
}		}

// Splat the index if needed.		// Splat the index if needed.
if (IntIdxTy->isVectorTy() && !Op->getType()->isVectorTy())		if (IntIdxTy->isVectorTy() && !Op->getType()->isVectorTy())
Op = Builder->CreateVectorSplat(IntIdxTy->getVectorNumElements(), Op);		Op = Builder->CreateVectorSplat(IntIdxTy->getVectorNumElements(), Op);

// Convert to correct type.		// Convert to correct type.
if (Op->getType() != IntIdxTy)		if (Op->getType() != IntIdxTy)
Op = Builder->CreateIntCast(Op, IntIdxTy, true, Op->getName()+".c");		Op = Builder->CreateIntCast(Op, IntIdxTy, true, Op->getName()+".c");
if (Size != 1) {		if (Size != 1) {
// We'll let instcombine(mul) convert this to a shl if possible.		// We'll let instcombine(mul) convert this to a shl if possible.
Op = Builder->CreateMul(Op, ConstantInt::get(IntIdxTy, Size),		Op = Builder->CreateMul(Op, ConstantInt::get(IntIdxTy, Size),
GEP->getName() + ".idx", false /*NUW*/,		GEP->getName() + ".idx", IsNonNegative /*NUW*/,
isInBounds /*NSW*/);		isInBounds /*NSW*/);
}		}

// Emit an add instruction.		// Emit an add instruction.
Result = Builder->CreateAdd(Op, Result, GEP->getName()+".offs");		Result = Builder->CreateAdd(Op, Result, GEP->getName()+".offs");
}		}
return Result;		return Result;
}		}

}		}

#endif // LLVM_TRANSFORMS_UTILS_LOCAL_H		#endif // LLVM_TRANSFORMS_UTILS_LOCAL_H

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

Show First 20 Lines • Show All 1,579 Lines • ▼ Show 20 Lines	Instruction *InstCombiner::visitFAdd(BinaryOperator &I) {

return nullptr;		return nullptr;
}		}

/// Optimize pointer differences into the same array into a size. Consider:		/// Optimize pointer differences into the same array into a size. Consider:
/// &A[10] - &A[0]: we should compile this to "10". LHS/RHS are the pointer		/// &A[10] - &A[0]: we should compile this to "10". LHS/RHS are the pointer
/// operands to the ptrtoint instructions for the LHS/RHS of the subtract.		/// operands to the ptrtoint instructions for the LHS/RHS of the subtract.
Value InstCombiner::OptimizePointerDifference(Value LHS, Value *RHS,		Value InstCombiner::OptimizePointerDifference(Value LHS, Value *RHS,
Type *Ty) {		Type *Ty, bool IsNUW) {
// If LHS is a gep based on RHS or RHS is a gep based on LHS, we can optimize		// If LHS is a gep based on RHS or RHS is a gep based on LHS, we can optimize
// this.		// this.
bool Swapped = false;		bool Swapped = false;
GEPOperator GEP1 = nullptr, GEP2 = nullptr;		GEPOperator GEP1 = nullptr, GEP2 = nullptr;

// For now we require one side to be the base pointer "A" or a constant		// For now we require one side to be the base pointer "A" or a constant
// GEP derived from it.		// GEP derived from it.
if (GEPOperator *LHSGEP = dyn_cast<GEPOperator>(LHS)) {		if (GEPOperator *LHSGEP = dyn_cast<GEPOperator>(LHS)) {
▲ Show 20 Lines • Show All 49 Lines • ▼ Show 20 Lines	if (GEP2) {
if (NumNonConstantIndices1 + NumNonConstantIndices2 > 1 &&		if (NumNonConstantIndices1 + NumNonConstantIndices2 > 1 &&
((NumNonConstantIndices1 > 0 && !GEP1->hasOneUse()) \|\|		((NumNonConstantIndices1 > 0 && !GEP1->hasOneUse()) \|\|
(NumNonConstantIndices2 > 0 && !GEP2->hasOneUse()))) {		(NumNonConstantIndices2 > 0 && !GEP2->hasOneUse()))) {
return nullptr;		return nullptr;
}		}
}		}

// Emit the offset of the GEP and an intptr_t.		// Emit the offset of the GEP and an intptr_t.
Value *Result = EmitGEPOffset(GEP1);		bool IsNonNegative = IsNUW && !GEP2 && !Swapped;
		Value *Result = EmitGEPOffset(GEP1, IsNonNegative);

// If we had a constant expression GEP on the other side offsetting the		// If we had a constant expression GEP on the other side offsetting the
// pointer, subtract it from the offset we have.		// pointer, subtract it from the offset we have.
if (GEP2) {		if (GEP2) {
Value *Offset = EmitGEPOffset(GEP2);		Value *Offset = EmitGEPOffset(GEP2);
Result = Builder.CreateSub(Result, Offset);		Result = Builder.CreateSub(Result, Offset);
}		}

▲ Show 20 Lines • Show All 315 Lines • ▼ Show 20 Lines	if (Op1->hasOneUse()) {
}		}
}		}

// Optimize pointer differences into the same array into a size. Consider:		// Optimize pointer differences into the same array into a size. Consider:
// &A[10] - &A[0]: we should compile this to "10".		// &A[10] - &A[0]: we should compile this to "10".
Value LHSOp, RHSOp;		Value LHSOp, RHSOp;
if (match(Op0, m_PtrToInt(m_Value(LHSOp))) &&		if (match(Op0, m_PtrToInt(m_Value(LHSOp))) &&
match(Op1, m_PtrToInt(m_Value(RHSOp))))		match(Op1, m_PtrToInt(m_Value(RHSOp))))
if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))		if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType(),
		I.hasNoUnsignedWrap()))
return replaceInstUsesWith(I, Res);		return replaceInstUsesWith(I, Res);

// trunc(p)-trunc(q) -> trunc(p-q)		// trunc(p)-trunc(q) -> trunc(p-q)
if (match(Op0, m_Trunc(m_PtrToInt(m_Value(LHSOp)))) &&		if (match(Op0, m_Trunc(m_PtrToInt(m_Value(LHSOp)))) &&
match(Op1, m_Trunc(m_PtrToInt(m_Value(RHSOp)))))		match(Op1, m_Trunc(m_PtrToInt(m_Value(RHSOp)))))
if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))		if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType(),
		/* IsNUW */ false))
return replaceInstUsesWith(I, Res);		return replaceInstUsesWith(I, Res);

// Canonicalize a shifty way to code absolute value to the common pattern.		// Canonicalize a shifty way to code absolute value to the common pattern.
// There are 2 potential commuted variants.		// There are 2 potential commuted variants.
// We're relying on the fact that we only do this transform when the shift has		// We're relying on the fact that we only do this transform when the shift has
// exactly 2 uses and the xor has exactly 1 use (otherwise, we might increase		// exactly 2 uses and the xor has exactly 1 use (otherwise, we might increase
// instructions).		// instructions).
Value *A;		Value *A;
▲ Show 20 Lines • Show All 212 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

Show First 20 Lines • Show All 363 Lines • ▼ Show 20 Lines	public:
// Return Value:		// Return Value:
// null - No change was made		// null - No change was made
// I - Change was made, I is still valid, I may be dead though		// I - Change was made, I is still valid, I may be dead though
// otherwise - Change was made, replace I with returned instruction		// otherwise - Change was made, replace I with returned instruction
//		//
Instruction *visitFNeg(UnaryOperator &I);		Instruction *visitFNeg(UnaryOperator &I);
Instruction *visitAdd(BinaryOperator &I);		Instruction *visitAdd(BinaryOperator &I);
Instruction *visitFAdd(BinaryOperator &I);		Instruction *visitFAdd(BinaryOperator &I);
Value OptimizePointerDifference(Value LHS, Value RHS, Type Ty);		Value *OptimizePointerDifference(
		Value LHS, Value RHS, Type *Ty, bool IsNUW);
Instruction *visitSub(BinaryOperator &I);		Instruction *visitSub(BinaryOperator &I);
Instruction *visitFSub(BinaryOperator &I);		Instruction *visitFSub(BinaryOperator &I);
Instruction *visitMul(BinaryOperator &I);		Instruction *visitMul(BinaryOperator &I);
Instruction *visitFMul(BinaryOperator &I);		Instruction *visitFMul(BinaryOperator &I);
Instruction *visitURem(BinaryOperator &I);		Instruction *visitURem(BinaryOperator &I);
Instruction *visitSRem(BinaryOperator &I);		Instruction *visitSRem(BinaryOperator &I);
Instruction *visitFRem(BinaryOperator &I);		Instruction *visitFRem(BinaryOperator &I);
bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I);		bool simplifyDivRemOfSelectWithZeroOp(BinaryOperator &I);
▲ Show 20 Lines • Show All 208 Lines • ▼ Show 20 Lines	bool willNotOverflow(BinaryOperator::BinaryOps Opcode, const Value *LHS,
switch (Opcode) {		switch (Opcode) {
case Instruction::Add: return willNotOverflowAdd(LHS, RHS, CxtI, IsSigned);		case Instruction::Add: return willNotOverflowAdd(LHS, RHS, CxtI, IsSigned);
case Instruction::Sub: return willNotOverflowSub(LHS, RHS, CxtI, IsSigned);		case Instruction::Sub: return willNotOverflowSub(LHS, RHS, CxtI, IsSigned);
case Instruction::Mul: return willNotOverflowMul(LHS, RHS, CxtI, IsSigned);		case Instruction::Mul: return willNotOverflowMul(LHS, RHS, CxtI, IsSigned);
default: llvm_unreachable("Unexpected opcode for overflow query");		default: llvm_unreachable("Unexpected opcode for overflow query");
}		}
}		}

Value EmitGEPOffset(User GEP);		Value EmitGEPOffset(User GEP, bool IsNonNegative = false);
Instruction scalarizePHI(ExtractElementInst &EI, PHINode PN);		Instruction scalarizePHI(ExtractElementInst &EI, PHINode PN);
Instruction *foldCastedBitwiseLogic(BinaryOperator &I);		Instruction *foldCastedBitwiseLogic(BinaryOperator &I);
Instruction *narrowBinOp(TruncInst &Trunc);		Instruction *narrowBinOp(TruncInst &Trunc);
Instruction *narrowMaskedBinOp(BinaryOperator &And);		Instruction *narrowMaskedBinOp(BinaryOperator &And);
Instruction *narrowMathIfNoOverflow(BinaryOperator &I);		Instruction *narrowMathIfNoOverflow(BinaryOperator &I);
Instruction *narrowRotate(TruncInst &Trunc);		Instruction *narrowRotate(TruncInst &Trunc);
Instruction optimizeBitCastFromPhi(CastInst &CI, PHINode PN);		Instruction optimizeBitCastFromPhi(CastInst &CI, PHINode PN);
Instruction *matchSAddSubSat(SelectInst &MinMax1);		Instruction *matchSAddSubSat(SelectInst &MinMax1);
▲ Show 20 Lines • Show All 402 Lines • Show Last 20 Lines

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

	Show First 20 Lines • Show All 152 Lines • ▼ Show 20 Lines
	// increases variable availability at the cost of accuracy. Variables that			// increases variable availability at the cost of accuracy. Variables that
	// cannot be promoted by mem2reg or SROA will be described as living in memory			// cannot be promoted by mem2reg or SROA will be described as living in memory
	// for their entire lifetime. However, passes like DSE and instcombine can			// for their entire lifetime. However, passes like DSE and instcombine can
	// delete stores to the alloca, leading to misleading and inaccurate debug			// delete stores to the alloca, leading to misleading and inaccurate debug
	// information. This flag can be removed when those passes are fixed.			// information. This flag can be removed when those passes are fixed.
	static cl::opt<unsigned> ShouldLowerDbgDeclare("instcombine-lower-dbg-declare",			static cl::opt<unsigned> ShouldLowerDbgDeclare("instcombine-lower-dbg-declare",
	cl::Hidden, cl::init(true));			cl::Hidden, cl::init(true));

	Value InstCombiner::EmitGEPOffset(User GEP) {			Value InstCombiner::EmitGEPOffset(User GEP, bool IsNonNegative) {
	return llvm::EmitGEPOffset(&Builder, DL, GEP);			return llvm::EmitGEPOffset(&Builder, DL, GEP, /* NoAssumptions */ false,
				IsNonNegative);
	}			}

	/// Return true if it is desirable to convert an integer computation from a			/// Return true if it is desirable to convert an integer computation from a
	/// given bit width to a new bit width.			/// given bit width to a new bit width.
	/// We don't want to convert from a legal to an illegal type or from a smaller			/// We don't want to convert from a legal to an illegal type or from a smaller
	/// to a larger illegal type. A width of '1' is always treated as a legal type			/// to a larger illegal type. A width of '1' is always treated as a legal type
	/// because i1 is a fundamental type in IR, and there are many specialized			/// because i1 is a fundamental type in IR, and there are many specialized
	/// optimizations for i1 types. Widths of 8, 16 or 32 are equally treated as			/// optimizations for i1 types. Widths of 8, 16 or 32 are equally treated as
	▲ Show 20 Lines • Show All 3,572 Lines • Show Last 20 Lines

llvm/test/Transforms/InstCombine/sub-gep.ll

Show All 10 Lines	;
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub i64 %i2, %i1		%d = sub i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

define i64 @test_inbounds_nuw([0 x i32]* %base, i64 %idx) {		define i64 @test_inbounds_nuw([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_inbounds_nuw(		; CHECK-LABEL: @test_inbounds_nuw(
; CHECK-NEXT: [[P2_IDX:%.*]] = shl nsw i64 [[IDX:%.*]], 2		; CHECK-NEXT: [[P2_IDX:%.*]] = shl nuw nsw i64 [[IDX:%.*]], 2
; CHECK-NEXT: ret i64 [[P2_IDX]]		; CHECK-NEXT: ret i64 [[P2_IDX]]
;		;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0
%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}

define i64 @test_nuw([0 x i32]* %base, i64 %idx) {		define i64 @test_nuw([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_nuw(		; CHECK-LABEL: @test_nuw(
; CHECK-NEXT: [[P2_IDX:%.*]] = shl i64 [[IDX:%.*]], 2		; CHECK-NEXT: [[P2_IDX:%.*]] = shl nuw i64 [[IDX:%.*]], 2
; CHECK-NEXT: ret i64 [[P2_IDX]]		; CHECK-NEXT: ret i64 [[P2_IDX]]
;		;
%p1 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 0
%p2 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p2 = getelementptr [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}
		lebedev.riUnsubmitted Done Reply Inline Actions ---------------------------------------- define i64 @test_nuw(* %base, i64 %idx) { %0: %p1 = gep * %base, 0 x i64 0, 4 x i64 0 %p2 = gep * %base, 0 x i64 0, 4 x i64 %idx %i1 = ptrtoint * %p1 to i64 %i2 = ptrtoint * %p2 to i64 %d = sub nuw i64 %i2, %i1 ret i64 %d } => define i64 @test_nuw(* %base, i64 %idx) { %0: %P2_IDX = shl nuw i64 %idx, 2 ret i64 %P2_IDX } Transformation doesn't verify! ERROR: Target is more poisonous than source Example: * %base = null i64 %idx = undef Source: * %p1 = null * %p2 = null [based on undef value] i64 %i1 = #x0000000000000000 (0) i64 %i2 = #x0000000000000000 (0) i64 %d = #x0000000000000000 (0) Target: i64 %P2_IDX = poison Source value: #x0000000000000000 (0) Target value: poison Summary: 0 correct transformations 1 incorrect transformations 0 errors lebedev.ri: ``` ---------------------------------------- define i64 @test_nuw(* %base, i64 %idx) { %0…
		nikicAuthorUnsubmitted Done Reply Inline Actions Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top bit set, then %p1 and %p2 will both be zero and the original sub is nuw, but shifting the %idx is not nuw. nikic: Thanks for catching this! To give a more specific example, if %base=0 and %idx has only the top…

define i32 @test_inbounds_nuw_trunc([0 x i32]* %base, i64 %idx) {		define i32 @test_inbounds_nuw_trunc([0 x i32]* %base, i64 %idx) {
; CHECK-LABEL: @test_inbounds_nuw_trunc(		; CHECK-LABEL: @test_inbounds_nuw_trunc(
; CHECK-NEXT: [[IDX_TR:%.*]] = trunc i64 [[IDX:%.*]] to i32		; CHECK-NEXT: [[IDX_TR:%.*]] = trunc i64 [[IDX:%.*]] to i32
; CHECK-NEXT: [[TMP1:%.*]] = shl i32 [[IDX_TR]], 2		; CHECK-NEXT: [[TMP1:%.*]] = shl i32 [[IDX_TR]], 2
; CHECK-NEXT: ret i32 [[TMP1]]		; CHECK-NEXT: ret i32 [[TMP1]]
;		;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 0
Show All 28 Lines
; CHECK-NEXT: ret i64 [[TMP1]]		; CHECK-NEXT: ret i64 [[TMP1]]
;		;
%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx		%p1 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx
%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx2		%p2 = getelementptr inbounds [0 x i32], [0 x i32]* %base, i64 0, i64 %idx2
%i1 = ptrtoint i32* %p1 to i64		%i1 = ptrtoint i32* %p1 to i64
%i2 = ptrtoint i32* %p2 to i64		%i2 = ptrtoint i32* %p2 to i64
%d = sub nuw i64 %i2, %i1		%d = sub nuw i64 %i2, %i1
ret i64 %d		ret i64 %d
}		}
		lebedev.riUnsubmitted Done Reply Inline Actions Precommit this? lebedev.ri: Precommit this?

This is an archive of the discontinued LLVM Phabricator instance.

[InstCombine] Preserve nuw on sub of geps (PR44419)ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 235749

llvm/include/llvm/Analysis/Utils/Local.h

llvm/lib/Transforms/InstCombine/InstCombineAddSub.cpp

llvm/lib/Transforms/InstCombine/InstCombineInternal.h

llvm/lib/Transforms/InstCombine/InstructionCombining.cpp

llvm/test/Transforms/InstCombine/sub-gep.ll

[InstCombine] Preserve nuw on sub of geps (PR44419)
ClosedPublic