This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/
-
lib/Analysis/
-
Analysis/
3/3
ScalarEvolution.cpp
-
test/Analysis/ScalarEvolution/
-
Analysis/
-
ScalarEvolution/
5/5
sdiv.ll
-
srem.ll

Differential D82721

[ScalarEvolution] createSCEV(): recognize `udiv`/`urem` disguised as an `sdiv`/`srem`
ClosedPublic

Authored by lebedev.ri on Jun 28 2020, 10:43 AM.

Download Raw Diff

Details

Reviewers

mkazantsev
efriedma
nikic
reames

Commits

rG2c16100e6f72: [ScalarEvolution] createSCEV(): recognize `udiv`/`urem` disguised as an…

Summary

While InstCombine trivially converts that `srem` into a `urem`,
it might happen later than wanted. In particular, I'd like
that to happen on the https://godbolt.org/z/bwuEmJ test case
early in the pipeline, before the first InstCombine run, just before -mem2reg.

SCEV should recognize this case natively.

Diff Detail

Repository: rG LLVM Github Monorepo

Event Timeline

lebedev.ri created this revision. · Jun 28 2020, 10:43 AM

Herald added a project: Restricted Project. · View Herald TranscriptJun 28 2020, 10:43 AM

Herald added subscribers: llvm-commits, javed.absar, hiraditya. · View Herald Transcript

lebedev.ri edited the summary of this revision. (Show Details)Jun 28 2020, 10:44 AM

lebedev.ri marked an inline comment as done.

lebedev.ri added inline comments.

llvm/lib/Analysis/ScalarEvolution.cpp
4343	This is a pretty verbatim copypasta from `InstCombiner::visitSRem()`

Harbormaster failed remote builds in B62058: Diff 273955!Jun 28 2020, 11:19 AM

Not sure I understand what benefit you're expecting on the linked testcase.

llvm/lib/Analysis/ScalarEvolution.cpp
4344	Can we stick this code into ScalarEvolution::createSCEV directly? I don't think any of the other users of MatchBinaryOp care whether they get a urem or an srem. Can we use the same code for sdiv?
4350	Can we not use isKnownNonNegative?

In D82721#2120692, @efriedma wrote:

Not sure I understand what benefit you're expecting on the linked testcase.

Since in SCEV it now becomes some expression (as opposed to just SCEVUnknown),
it can reason about it more. In particular, SCEVExpander tries to hoist stuff
as much as possible, and now that it is no longer some opaque SCEVUnknown,
but an SCEVURem with non-zero divisor, it gets hoisted.

Ex. 1: i & 1:

*** IR Dump Before rewrite allocas if that makes them promotable ***
; Function Attrs: uwtable
define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
entry:
  %storage = alloca [2 x i32], align 4
  %0 = bitcast [2 x i32]* %storage to i8*
  call void @llvm.lifetime.start.p0i8(i64 8, i8* %0) #3
  br label %for.cond

for.cond:                                         ; preds = %for.body, %entry
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp ne i32 %i.0, %width
  br i1 %cmp, label %for.body, label %for.cond.cleanup

for.cond.cleanup:                                 ; preds = %for.cond
  call void @llvm.lifetime.end.p0i8(i64 8, i8* %0) #3
  ret void

for.body:                                         ; preds = %for.cond
  %and = and i32 %i.0, 1
  %1 = zext i32 %and to i64
  %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %1
  %2 = load i32, i32* %arrayidx, align 4, !tbaa !2
  %call = call i32 @_Z3adji(i32 %2)
  %3 = load i32, i32* %arrayidx, align 4, !tbaa !2
  %add = add nsw i32 %3, %call
  store i32 %add, i32* %arrayidx, align 4, !tbaa !2
  %inc = add nsw i32 %i.0, 1
  br label %for.cond
}
*** IR Dump After rewrite allocas if that makes them promotable ***
; Function Attrs: uwtable
define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
entry:
  %storage.apc.retyped = alloca <8 x i8>, align 4
  br label %for.cond

for.cond:                                         ; preds = %for.body, %entry
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %0 = mul i32 %i.0, -1
  %1 = trunc i32 %0 to i1
  %2 = zext i1 %1 to i64
  %cmp = icmp ne i32 %i.0, %width
  br i1 %cmp, label %for.body, label %for.cond.cleanup

for.cond.cleanup:                                 ; preds = %for.cond
  ret void

for.body:                                         ; preds = %for.cond
  %3 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %4 = bitcast <8 x i8> %3 to <2 x i32>
  %5 = extractelement <2 x i32> %4, i64 %2
  %call = call i32 @_Z3adji(i32 %5)
  %6 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %7 = bitcast <8 x i8> %6 to <2 x i32>
  %8 = extractelement <2 x i32> %7, i64 %2
  %add = add nsw i32 %8, %call
  %9 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %10 = bitcast <8 x i8> %9 to <2 x i32>
  %11 = insertelement <2 x i32> %10, i32 %add, i64 %2
  %12 = bitcast <2 x i32> %11 to <8 x i8>
  store <8 x i8> %12, <8 x i8>* %storage.apc.retyped, align 4
  %inc = add nsw i32 %i.0, 1
  br label %for.cond
}

So it got hoisted. But now,

Ex. 2: i % 2:

*** IR Dump Before rewrite allocas if that makes them promotable ***
; Function Attrs: uwtable
define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
entry:
  %storage = alloca [2 x i32], align 4
  %0 = bitcast [2 x i32]* %storage to i8*
  call void @llvm.lifetime.start.p0i8(i64 8, i8* %0) #3
  br label %for.cond

for.cond:                                         ; preds = %for.body, %entry
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp ne i32 %i.0, %width
  br i1 %cmp, label %for.body, label %for.cond.cleanup

for.cond.cleanup:                                 ; preds = %for.cond
  call void @llvm.lifetime.end.p0i8(i64 8, i8* %0) #3
  ret void

for.body:                                         ; preds = %for.cond
  %rem = srem i32 %i.0, 2
  %idxprom = sext i32 %rem to i64
  %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %idxprom
  %1 = load i32, i32* %arrayidx, align 4, !tbaa !2
  %call = call i32 @_Z3adji(i32 %1)
  %2 = load i32, i32* %arrayidx, align 4, !tbaa !2
  %add = add nsw i32 %2, %call
  store i32 %add, i32* %arrayidx, align 4, !tbaa !2
  %inc = add nsw i32 %i.0, 1
  br label %for.cond
}
*** IR Dump After rewrite allocas if that makes them promotable ***
; Function Attrs: uwtable
define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
entry:
  %storage.apc.retyped = alloca <8 x i8>, align 4
  br label %for.cond

for.cond:                                         ; preds = %for.body, %entry
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp ne i32 %i.0, %width
  br i1 %cmp, label %for.body, label %for.cond.cleanup

for.cond.cleanup:                                 ; preds = %for.cond
  ret void

for.body:                                         ; preds = %for.cond
  %rem = srem i32 %i.0, 2
  %idxprom = sext i32 %rem to i64
  %0 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %1 = bitcast <8 x i8> %0 to <2 x i32>
  %2 = extractelement <2 x i32> %1, i64 %idxprom
  %call = call i32 @_Z3adji(i32 %2)
  %3 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %4 = bitcast <8 x i8> %3 to <2 x i32>
  %5 = extractelement <2 x i32> %4, i64 %idxprom
  %add = add nsw i32 %5, %call
  %6 = load <8 x i8>, <8 x i8>* %storage.apc.retyped, align 4
  %7 = bitcast <8 x i8> %6 to <2 x i32>
  %8 = insertelement <2 x i32> %7, i32 %add, i64 %idxprom
  %9 = bitcast <2 x i32> %8 to <8 x i8>
  store <8 x i8> %9, <8 x i8>* %storage.apc.retyped, align 4
  %inc = add nsw i32 %i.0, 1
  br label %for.cond
}

Nope, not hoisted without this patch.

That's an inconsistency. It leads to other differences, e.g.:

*** IR Dump Before Rotate Loops ***
; Preheader:
entry:
  br label %for.cond

; Loop:
for.cond:                                         ; preds = %for.body, %entry
  <badref> = phi <2 x i32> [ undef, %entry ], [ %4, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  <badref> = and i32 %i.0, 1
  <badref> = zext i32 %1 to i64
  %cmp = icmp eq i32 %i.0, %width
  br i1 %cmp, label %for.cond.cleanup, label %for.body

for.body:                                         ; preds = %for.cond
  <badref> = extractelement <2 x i32> %0, i64 %2
  %call = tail call i32 @_Z3adji(i32 %3)
  %add = add nsw i32 %call, %3
  <badref> = insertelement <2 x i32> %0, i32 %add, i64 %2
  %inc = add nuw nsw i32 %i.0, 1
  br label %for.cond

; Exit blocks
for.cond.cleanup:                                 ; preds = %for.cond
  ret void
*** IR Dump After Rotate Loops ***
; Preheader:
for.body.lr.ph:                                   ; preds = %entry
  br label %for.body

; Loop:
for.body:                                         ; preds = %for.body.lr.ph, %for.body
  <badref> = phi i64 [ 0, %for.body.lr.ph ], [ %5, %for.body ]
  %i.07 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
  <badref> = phi <2 x i32> [ undef, %for.body.lr.ph ], [ %3, %for.body ]
  <badref> = extractelement <2 x i32> %1, i64 %0
  %call = tail call i32 @_Z3adji(i32 %2)
  %add = add nsw i32 %call, %2
  <badref> = insertelement <2 x i32> %1, i32 %add, i64 %0
  %inc = add nuw nsw i32 %i.07, 1
  <badref> = and i32 %inc, 1
  <badref> = zext i32 %4 to i64
  %cmp = icmp eq i32 %inc, %width
  br i1 %cmp, label %for.cond.for.cond.cleanup_crit_edge, label %for.body

; Exit blocks
for.cond.for.cond.cleanup_crit_edge:              ; preds = %for.body
  br label %for.cond.cleanup

vs.

*** IR Dump Before Rotate Loops ***
; Preheader:
entry:
  br label %for.cond

; Loop:
for.cond:                                         ; preds = %for.body, %entry
  <badref> = phi <2 x i32> [ undef, %entry ], [ %2, %for.body ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
  %cmp = icmp eq i32 %i.0, %width
  br i1 %cmp, label %for.cond.cleanup, label %for.body

for.body:                                         ; preds = %for.cond
  %rem = and i32 %i.0, 1
  %idxprom = zext i32 %rem to i64
  <badref> = extractelement <2 x i32> %0, i64 %idxprom
  %call = tail call i32 @_Z3adji(i32 %1)
  %add = add nsw i32 %call, %1
  <badref> = insertelement <2 x i32> %0, i32 %add, i64 %idxprom
  %inc = add nuw nsw i32 %i.0, 1
  br label %for.cond

; Exit blocks
for.cond.cleanup:                                 ; preds = %for.cond
  ret void
*** IR Dump After Rotate Loops ***
; Preheader:
for.body.lr.ph:                                   ; preds = %entry
  br label %for.body

; Loop:
for.body:                                         ; preds = %for.body.lr.ph, %for.body
  %i.07 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.body ]
  <badref> = phi <2 x i32> [ undef, %for.body.lr.ph ], [ %2, %for.body ]
  %rem = and i32 %i.07, 1
  %idxprom = zext i32 %rem to i64
  <badref> = extractelement <2 x i32> %0, i64 %idxprom
  %call = tail call i32 @_Z3adji(i32 %1)
  %add = add nsw i32 %call, %1
  <badref> = insertelement <2 x i32> %0, i32 %add, i64 %idxprom
  %inc = add nuw nsw i32 %i.07, 1
  %cmp = icmp eq i32 %inc, %width
  br i1 %cmp, label %for.cond.for.cond.cleanup_crit_edge, label %for.body

; Exit blocks
for.cond.for.cond.cleanup_crit_edge:              ; preds = %for.body
  br label %for.cond.cleanup

I'm not going to argue which result is better, but *normally* there wouldn't be such an srem,
so the current outcome is an outlier, and i would think we would prefer to not have such odd outliers.

Addressing review notes:

Sink into createSCEV()
Use SCEV's isKnownNonNegative()
Also handle sdiv

Harbormaster failed remote builds in B62200: Diff 274203!Jun 29 2020, 1:01 PM

lebedev.ri retitled this revision from [ScalarEvolution] createSCEV(): MatchBinaryOp(): recognize `urem` disguised as an `srem` to [ScalarEvolution] createSCEV(): recognize `udiv`/`urem` disguised as an `sdiv`/`srem`.Jul 1 2020, 4:56 AM

Your transform log refers to the "rewrite allocas if that makes them promotable" pass, but I wasn't able to find it in the code base. Could you point me to where it is implemented?

In D82721#2126191, @nikic wrote:

Your transform log refers to the "rewrite allocas if that makes them promotable" pass,

I'm not sure it's material to the patch in question..

but I wasn't able to find it in the code base.

Correct. There is no such thing in llvm.

Could you point me to where it is implemented?

~~it's wip https://github.com/LebedevRI/llvm-project/tree/alloca-promotion~~

Thanks for the context! That makes it clearer what the motivation here is. You are adding a new SCEV-based pass, that runs very early in the pipeline, before even the first InstCombine run, so it needs SCEV to deal with non-canonical IR. I see you mentioned this in the description, but I was missing the "why" of it.

I'm not seeing any negative compile-time impact from this change, so this change seems ok to me.

In D82721#2126454, @nikic wrote:

Thanks for the context! That makes it clearer what the motivation here is. You are adding a new SCEV-based pass, that runs very early in the pipeline, before even the first InstCombine run, so it needs SCEV to deal with non-canonical IR. I see you mentioned this in the description, but I was missing the "why" of it.

That's the gist of it, yes.

I'm not seeing any negative compile-time impact from this change, so this change seems ok to me.

Cool, thanks for checking.

efriedma added inline comments.Jul 1 2020, 3:20 PM

llvm/test/Analysis/ScalarEvolution/sdiv.ll
17	What are you diffing against here?

lebedev.ri marked 2 inline comments as done.Jul 1 2020, 3:45 PM

lebedev.ri added inline comments.

llvm/test/Analysis/ScalarEvolution/sdiv.ll
17	Didn't push the test commit originally. Now done: rG51ff7642a33f73518d60909e3fe4e6348dcc7b27.

lebedev.ri marked an inline comment as done.Jul 1 2020, 3:46 PM

lebedev.ri planned changes to this revision.Jul 1 2020, 4:04 PM

clementval added a subscriber: clementval.Jul 1 2020, 4:34 PM

clementval added inline comments.

llvm/test/Analysis/ScalarEvolution/sdiv.ll
17	This commit is making a bunch of buildbots fail. Can you revert it?

Ok, now for real.

lebedev.ri marked an inline comment as done.Jul 1 2020, 4:36 PM

LGTM

llvm/test/Analysis/ScalarEvolution/sdiv.ll
17	Oh, that makes more sense.

This revision is now accepted and ready to land. · Jul 1 2020, 5:37 PM

Harbormaster failed remote builds in B62598: Diff 274955!Jul 1 2020, 5:50 PM

In D82721#2126986, @efriedma wrote:

LGTM

Thank you for the review!

llvm/test/Analysis/ScalarEvolution/sdiv.ll
17	Yeah, somehow i ended up with wrong initial check lines, and didn't notice it, oops. Sorry.

lebedev.ri marked an inline comment as done.Jul 2 2020, 2:41 AM

Closed by commit rG2c16100e6f72: [ScalarEvolution] createSCEV(): recognize `udiv`/`urem` disguised as an… (authored by lebedev.ri). · Explain WhyJul 2 2020, 3:43 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

llvm/

lib/

Analysis/

ScalarEvolution.cpp

14 lines

test/

Analysis/

ScalarEvolution/

sdiv.ll

6 lines

srem.ll

6 lines

Diff 275044

llvm/lib/Analysis/ScalarEvolution.cpp

This file is larger than 256 KB, so syntax highlighting is disabled by default.

Show First 20 Lines • Show All 4,334 Lines • ▼ Show 20 Lines	if (ConstantInt *SA = dyn_cast<ConstantInt>(Op->getOperand(1))) {
Constant *X =		Constant *X =
ConstantInt::get(SA->getContext(),		ConstantInt::get(SA->getContext(),
APInt::getOneBitSet(BitWidth, SA->getZExtValue()));		APInt::getOneBitSet(BitWidth, SA->getZExtValue()));
return BinaryOp(Instruction::UDiv, Op->getOperand(0), X);		return BinaryOp(Instruction::UDiv, Op->getOperand(0), X);
}		}
}		}
return BinaryOp(Op);		return BinaryOp(Op);

case Instruction::ExtractValue: {		case Instruction::ExtractValue: {
		lebedev.riAuthorUnsubmitted Done Reply Inline Actions This is a pretty verbatim copypasta from `InstCombiner::visitSRem()` lebedev.ri: This is a pretty verbatim copypasta from `InstCombiner::visitSRem()`
auto *EVI = cast<ExtractValueInst>(Op);		auto *EVI = cast<ExtractValueInst>(Op);
		efriedmaUnsubmitted Done Reply Inline Actions Can we stick this code into ScalarEvolution::createSCEV directly? I don't think any of the other users of MatchBinaryOp care whether they get a urem or an srem. Can we use the same code for sdiv? efriedma: Can we stick this code into ScalarEvolution::createSCEV directly? I don't think any of the…
if (EVI->getNumIndices() != 1 \|\| EVI->getIndices()[0] != 0)		if (EVI->getNumIndices() != 1 \|\| EVI->getIndices()[0] != 0)
break;		break;

auto *WO = dyn_cast<WithOverflowInst>(EVI->getAggregateOperand());		auto *WO = dyn_cast<WithOverflowInst>(EVI->getAggregateOperand());
if (!WO)		if (!WO)
break;		break;
		efriedmaUnsubmitted Done Reply Inline Actions Can we not use isKnownNonNegative? efriedma: Can we not use isKnownNonNegative?

Instruction::BinaryOps BinOp = WO->getBinaryOp();		Instruction::BinaryOps BinOp = WO->getBinaryOp();
bool Signed = WO->isSigned();		bool Signed = WO->isSigned();
// TODO: Should add nuw/nsw flags for mul as well.		// TODO: Should add nuw/nsw flags for mul as well.
if (BinOp == Instruction::Mul \|\| !isOverflowIntrinsicNoWrap(WO, DT))		if (BinOp == Instruction::Mul \|\| !isOverflowIntrinsicNoWrap(WO, DT))
return BinaryOp(BinOp, WO->getLHS(), WO->getRHS());		return BinaryOp(BinOp, WO->getLHS(), WO->getRHS());

// Now that we know that all uses of the arithmetic-result component of		// Now that we know that all uses of the arithmetic-result component of
▲ Show 20 Lines • Show All 1,939 Lines • ▼ Show 20 Lines	case Instruction::SExt:
return getSignExtendExpr(getSCEV(U->getOperand(0)), U->getType());		return getSignExtendExpr(getSCEV(U->getOperand(0)), U->getType());

case Instruction::BitCast:		case Instruction::BitCast:
// BitCasts are no-op casts so we just eliminate the cast.		// BitCasts are no-op casts so we just eliminate the cast.
if (isSCEVable(U->getType()) && isSCEVable(U->getOperand(0)->getType()))		if (isSCEVable(U->getType()) && isSCEVable(U->getOperand(0)->getType()))
return getSCEV(U->getOperand(0));		return getSCEV(U->getOperand(0));
break;		break;

		case Instruction::SDiv:
		// If both operands are non-negative, this is just an udiv.
		if (isKnownNonNegative(getSCEV(U->getOperand(0))) &&
		isKnownNonNegative(getSCEV(U->getOperand(1))))
		return getUDivExpr(getSCEV(U->getOperand(0)), getSCEV(U->getOperand(1)));
		break;

		case Instruction::SRem:
		// If both operands are non-negative, this is just an urem.
		if (isKnownNonNegative(getSCEV(U->getOperand(0))) &&
		isKnownNonNegative(getSCEV(U->getOperand(1))))
		return getURemExpr(getSCEV(U->getOperand(0)), getSCEV(U->getOperand(1)));
		break;

// It's tempting to handle inttoptr and ptrtoint as no-ops, however this can		// It's tempting to handle inttoptr and ptrtoint as no-ops, however this can
// lead to pointer expressions which cannot safely be expanded to GEPs,		// lead to pointer expressions which cannot safely be expanded to GEPs,
// because ScalarEvolution doesn't respect the GEP aliasing rules when		// because ScalarEvolution doesn't respect the GEP aliasing rules when
// simplifying integer expressions.		// simplifying integer expressions.

case Instruction::GetElementPtr:		case Instruction::GetElementPtr:
return createNodeForGEP(cast<GEPOperator>(U));		return createNodeForGEP(cast<GEPOperator>(U));

▲ Show 20 Lines • Show All 6,145 Lines • Show Last 20 Lines

llvm/test/Analysis/ScalarEvolution/sdiv.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -scalar-evolution -analyze \| FileCheck %s			; RUN: opt < %s -scalar-evolution -analyze \| FileCheck %s

	target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"			target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
	target triple = "x86_64-unknown-linux-gnu"			target triple = "x86_64-unknown-linux-gnu"

	define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {			define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
	; CHECK-LABEL: '_Z4loopi'			; CHECK-LABEL: '_Z4loopi'
	; CHECK-NEXT: Classifying expressions for: @_Z4loopi			; CHECK-NEXT: Classifying expressions for: @_Z4loopi
	; CHECK-NEXT: %storage = alloca [2 x i32], align 4			; CHECK-NEXT: %storage = alloca [2 x i32], align 4
	; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)			; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)
	; CHECK-NEXT: %0 = bitcast [2 x i32]* %storage to i8*			; CHECK-NEXT: %0 = bitcast [2 x i32]* %storage to i8*
	; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)			; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)
	; CHECK-NEXT: %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]			; CHECK-NEXT: %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
	; CHECK-NEXT: --> {0,+,1}<nuw><nsw><%for.cond> U: [0,-2147483648) S: [0,-2147483648) Exits: %width LoopDispositions: { %for.cond: Computable }			; CHECK-NEXT: --> {0,+,1}<nuw><nsw><%for.cond> U: [0,-2147483648) S: [0,-2147483648) Exits: %width LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %rem = sdiv i32 %i.0, 2			; CHECK-NEXT: %rem = sdiv i32 %i.0, 2
	; CHECK-NEXT: --> %rem U: full-set S: [-1073741824,1073741824) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> ({0,+,1}<nuw><nsw><%for.cond> /u 2) U: [0,1073741824) S: [0,1073741824) Exits: (%width /u 2) LoopDispositions: { %for.cond: Computable }
	efriedmaUnsubmitted Done Reply Inline Actions What are you diffing against here? efriedma: What are you diffing against here?
	lebedev.riAuthorUnsubmitted Done Reply Inline Actions Didn't push the test commit originally. Now done: rG51ff7642a33f73518d60909e3fe4e6348dcc7b27. lebedev.ri: Didn't push the test commit originally. Now done: rG51ff7642a33f73518d60909e3fe4e6348dcc7b27.
	clementvalUnsubmitted Done Reply Inline Actions This commit is making a bunch of builedbot failing. Can you revert it? clementval: This commit is making a bunch of builedbot failing. Can you revert it?
	efriedmaUnsubmitted Done Reply Inline Actions Oh, that makes more sense. efriedma: Oh, that makes more sense.
	lebedev.riAuthorUnsubmitted Done Reply Inline Actions Yeah, somehow i ended up with wrong initial check lines, and didn't notice it, oops. Sorry. lebedev.ri: Yeah, somehow i ended up with wrong initial check lines, and didn't notice it, oops. Sorry.
	; CHECK-NEXT: %idxprom = sext i32 %rem to i64			; CHECK-NEXT: %idxprom = sext i32 %rem to i64
	; CHECK-NEXT: --> (sext i32 %rem to i64) U: [-2147483648,2147483648) S: [-1073741824,1073741824) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> ({0,+,1}<nuw><nsw><%for.cond> /u 2) U: [0,2147483648) S: [0,2147483648) Exits: ((zext i32 %width to i64) /u 2) LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %idxprom			; CHECK-NEXT: %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %idxprom
	; CHECK-NEXT: --> ((4 * (sext i32 %rem to i64))<nsw> + %storage)<nsw> U: [0,-3) S: [-9223372036854775808,9223372036854775805) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> ((4 * ({0,+,1}<nuw><nsw><%for.cond> /u 2))<nuw><nsw> + %storage)<nsw> U: [0,-3) S: [-9223372036854775808,9223372036854775805) Exits: ((4 * ((zext i32 %width to i64) /u 2))<nuw><nsw> + %storage)<nsw> LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %1 = load i32, i32* %arrayidx, align 4			; CHECK-NEXT: %1 = load i32, i32* %arrayidx, align 4
	; CHECK-NEXT: --> %1 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %1 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %call = call i32 @_Z3adji(i32 %1)			; CHECK-NEXT: %call = call i32 @_Z3adji(i32 %1)
	; CHECK-NEXT: --> %call U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %call U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %2 = load i32, i32* %arrayidx, align 4			; CHECK-NEXT: %2 = load i32, i32* %arrayidx, align 4
	; CHECK-NEXT: --> %2 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %2 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %add = add nsw i32 %2, %call			; CHECK-NEXT: %add = add nsw i32 %2, %call
	; CHECK-NEXT: --> (%2 + %call) U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> (%2 + %call) U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	▲ Show 20 Lines • Show All 45 Lines • Show Last 20 Lines

llvm/test/Analysis/ScalarEvolution/srem.ll

	; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py			; NOTE: Assertions have been autogenerated by utils/update_analyze_test_checks.py
	; RUN: opt < %s -scalar-evolution -analyze \| FileCheck %s			; RUN: opt < %s -scalar-evolution -analyze \| FileCheck %s

	target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"			target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128"
	target triple = "x86_64-unknown-linux-gnu"			target triple = "x86_64-unknown-linux-gnu"

	define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {			define dso_local void @_Z4loopi(i32 %width) local_unnamed_addr #0 {
	; CHECK-LABEL: '_Z4loopi'			; CHECK-LABEL: '_Z4loopi'
	; CHECK-NEXT: Classifying expressions for: @_Z4loopi			; CHECK-NEXT: Classifying expressions for: @_Z4loopi
	; CHECK-NEXT: %storage = alloca [2 x i32], align 4			; CHECK-NEXT: %storage = alloca [2 x i32], align 4
	; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)			; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)
	; CHECK-NEXT: %0 = bitcast [2 x i32]* %storage to i8*			; CHECK-NEXT: %0 = bitcast [2 x i32]* %storage to i8*
	; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)			; CHECK-NEXT: --> %storage U: [0,-3) S: [-9223372036854775808,9223372036854775805)
	; CHECK-NEXT: %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]			; CHECK-NEXT: %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
	; CHECK-NEXT: --> {0,+,1}<nuw><nsw><%for.cond> U: [0,-2147483648) S: [0,-2147483648) Exits: %width LoopDispositions: { %for.cond: Computable }			; CHECK-NEXT: --> {0,+,1}<nuw><nsw><%for.cond> U: [0,-2147483648) S: [0,-2147483648) Exits: %width LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %rem = srem i32 %i.0, 2			; CHECK-NEXT: %rem = srem i32 %i.0, 2
	; CHECK-NEXT: --> %rem U: [0,2) S: [-2,2) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> (zext i1 {false,+,true}<%for.cond> to i32) U: [0,2) S: [0,2) Exits: (zext i1 (trunc i32 %width to i1) to i32) LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %idxprom = sext i32 %rem to i64			; CHECK-NEXT: %idxprom = sext i32 %rem to i64
	; CHECK-NEXT: --> (sext i32 %rem to i64) U: [0,2) S: [-2,2) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> (zext i1 {false,+,true}<%for.cond> to i64) U: [0,2) S: [0,2) Exits: (zext i1 (trunc i32 %width to i1) to i64) LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %idxprom			; CHECK-NEXT: %arrayidx = getelementptr inbounds [2 x i32], [2 x i32]* %storage, i64 0, i64 %idxprom
	; CHECK-NEXT: --> ((4 * (sext i32 %rem to i64))<nuw><nsw> + %storage)<nsw> U: [0,-3) S: [-9223372036854775808,9223372036854775805) Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> ((4 * (zext i1 {false,+,true}<%for.cond> to i64))<nuw><nsw> + %storage)<nsw> U: [0,-3) S: [-9223372036854775808,9223372036854775805) Exits: ((4 * (zext i1 (trunc i32 %width to i1) to i64))<nuw><nsw> + %storage)<nsw> LoopDispositions: { %for.cond: Computable }
	; CHECK-NEXT: %1 = load i32, i32* %arrayidx, align 4			; CHECK-NEXT: %1 = load i32, i32* %arrayidx, align 4
	; CHECK-NEXT: --> %1 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %1 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %call = call i32 @_Z3adji(i32 %1)			; CHECK-NEXT: %call = call i32 @_Z3adji(i32 %1)
	; CHECK-NEXT: --> %call U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %call U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %2 = load i32, i32* %arrayidx, align 4			; CHECK-NEXT: %2 = load i32, i32* %arrayidx, align 4
	; CHECK-NEXT: --> %2 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> %2 U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	; CHECK-NEXT: %add = add nsw i32 %2, %call			; CHECK-NEXT: %add = add nsw i32 %2, %call
	; CHECK-NEXT: --> (%2 + %call) U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }			; CHECK-NEXT: --> (%2 + %call) U: full-set S: full-set Exits: <<Unknown>> LoopDispositions: { %for.cond: Variant }
	▲ Show 20 Lines • Show All 45 Lines • Show Last 20 Lines