Index: include/llvm/Analysis/ScalarEvolution.h =================================================================== --- include/llvm/Analysis/ScalarEvolution.h +++ include/llvm/Analysis/ScalarEvolution.h @@ -1265,6 +1265,7 @@ } const SCEV *getUDivExpr(const SCEV *LHS, const SCEV *RHS); const SCEV *getUDivExactExpr(const SCEV *LHS, const SCEV *RHS); + const SCEV *getURemExpr(const SCEV *LHS, const SCEV *RHS); const SCEV *getAddRecExpr(const SCEV *Start, const SCEV *Step, const Loop *L, SCEV::NoWrapFlags Flags); const SCEV *getAddRecExpr(SmallVectorImpl &Operands, Index: lib/Analysis/ScalarEvolution.cpp =================================================================== --- lib/Analysis/ScalarEvolution.cpp +++ lib/Analysis/ScalarEvolution.cpp @@ -2945,6 +2945,34 @@ return getOrCreateMulExpr(Ops, Flags); } +/// Represents an unsigned remainder expression based on unsigned division. +const SCEV *ScalarEvolution::getURemExpr(const SCEV *LHS, + const SCEV *RHS) { + assert(getEffectiveSCEVType(LHS->getType()) == + getEffectiveSCEVType(RHS->getType()) && + "SCEVURemExpr operand types don't match!"); + + // Short-circuit easy cases + if (const SCEVConstant *RHSC = dyn_cast(RHS)) { + // If constant is one, the result is trivial + if (RHSC->getValue()->isOne()) + return getZero(LHS->getType()); // X urem 1 --> 0 + + // If constant is a power of two, fold into a zext(trunc(LHS)). + if (RHSC->getAPInt().isPowerOf2()) { + Type *FullTy = LHS->getType(); + Type *TruncTy = + IntegerType::get(getContext(), RHSC->getAPInt().logBase2()); + return getZeroExtendExpr(getTruncateExpr(LHS, TruncTy), FullTy); + } + } + + // Fallback to %a == %x urem %y == %x - ((%x udiv %y) * %y) + const SCEV *UDiv = getUDivExpr(LHS, RHS); + const SCEV *Mult = getMulExpr(UDiv, RHS, SCEV::FlagNUW); + return getMinusSCEV(LHS, Mult, SCEV::FlagNUW); +} + /// Get a canonical unsigned division expression, or something simpler if /// possible. const SCEV *ScalarEvolution::getUDivExpr(const SCEV *LHS, @@ -4105,6 +4133,7 @@ case Instruction::Sub: case Instruction::Mul: case Instruction::UDiv: + case Instruction::URem: case Instruction::And: case Instruction::Or: case Instruction::AShr: @@ -5750,6 +5779,8 @@ } case Instruction::UDiv: return getUDivExpr(getSCEV(BO->LHS), getSCEV(BO->RHS)); + case Instruction::URem: + return getURemExpr(getSCEV(BO->LHS), getSCEV(BO->RHS)); case Instruction::Sub: { SCEV::NoWrapFlags Flags = SCEV::FlagAnyWrap; if (BO->Op) Index: test/Analysis/ScalarEvolution/flattened-0.ll =================================================================== --- test/Analysis/ScalarEvolution/flattened-0.ll +++ test/Analysis/ScalarEvolution/flattened-0.ll @@ -0,0 +1,22 @@ +; RUN: opt < %s -scalar-evolution -analyze | FileCheck %s + +define void @foo([7 x i8]* %a) { +; CHECK-LABEL: @foo +entry: + br label %bb + +bb: + %idx = phi i64 [ 0, %entry ], [ %idx.incr, %bb ] + %i = udiv i64 %idx, 7 + %j = urem i64 %idx, 7 + %a.ptr = getelementptr [7 x i8], [7 x i8]* %a, i64 %i, i64 %j +; CHECK: %a.ptr = getelementptr [7 x i8], [7 x i8]* %a, i64 %i, i64 %j +; CHECK-NEXT: --> {%a,+,1}<%bb> + %val = load i8, i8* %a.ptr + %idx.incr = add i64 %idx, 1 + %test = icmp ne i64 %idx.incr, 35 + br i1 %test, label %bb, label %exit + +exit: + ret void +} Index: test/Analysis/ScalarEvolution/urem-0.ll =================================================================== --- test/Analysis/ScalarEvolution/urem-0.ll +++ test/Analysis/ScalarEvolution/urem-0.ll @@ -1,15 +1,33 @@ ; RUN: opt < %s -scalar-evolution -analyze | FileCheck %s define i8 @foo(i8 %a) { +; CHECK-LABEL: @foo %t0 = urem i8 %a, 27 -; CHECK: %t0 +; CHECK: %t0 = urem i8 %a, 27 ; CHECK-NEXT: --> ((-27 * (%a /u 27)) + %a) ret i8 %t0 } define i8 @bar(i8 %a) { +; CHECK-LABEL: @bar %t1 = urem i8 %a, 1 -; CHECK: %t1 +; CHECK: %t1 = urem i8 %a, 1 ; CHECK-NEXT: --> 0 ret i8 %t1 } + +define i8 @baz(i8 %a) { +; CHECK-LABEL: @baz + %t2 = urem i8 %a, 32 +; CHECK: %t2 = urem i8 %a, 32 +; CHECK-NEXT: --> (zext i5 (trunc i8 %a to i5) to i8) + ret i8 %t2 +} + +define i8 @qux(i8 %a) { +; CHECK-LABEL: @qux + %t3 = urem i8 %a, 2 +; CHECK: %t3 = urem i8 %a, 2 +; CHECK-NEXT: --> (zext i1 (trunc i8 %a to i1) to i8) + ret i8 %t3 +}