diff --git a/llvm/lib/Transforms/Scalar/LoopInterchange.cpp b/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
--- a/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
+++ b/llvm/lib/Transforms/Scalar/LoopInterchange.cpp
@@ -334,7 +334,7 @@
 
   /// Check if the loop structure is understood. We do not handle triangular
   /// loops for now.
-  bool isLoopStructureUnderstood(PHINode *InnerInductionVar);
+  bool isLoopStructureUnderstood();
 
   bool currentLimitations();
 
@@ -342,6 +342,10 @@
     return OuterInnerReductions;
   }
 
+  const SmallVectorImpl<PHINode *> &getInnerLoopInductions() const {
+    return InnerLoopInductions;
+  }
+
 private:
   bool tightlyNested(Loop *Outer, Loop *Inner);
   bool containsUnsafeInstructions(BasicBlock *BB);
@@ -365,6 +369,9 @@
   /// Set of reduction PHIs taking part of a reduction across the inner and
   /// outer loop.
   SmallPtrSet<PHINode *, 4> OuterInnerReductions;
+
+  /// Set of inner loop induction PHIs
+  SmallVector<PHINode *, 8> InnerLoopInductions;
 };
 
 /// LoopInterchangeProfitability checks if it is profitable to interchange the
@@ -635,25 +642,26 @@
   return true;
 }
 
-bool LoopInterchangeLegality::isLoopStructureUnderstood(
-    PHINode *InnerInduction) {
-  unsigned Num = InnerInduction->getNumOperands();
+bool LoopInterchangeLegality::isLoopStructureUnderstood() {
   BasicBlock *InnerLoopPreheader = InnerLoop->getLoopPreheader();
-  for (unsigned i = 0; i < Num; ++i) {
-    Value *Val = InnerInduction->getOperand(i);
-    if (isa<Constant>(Val))
-      continue;
-    Instruction *I = dyn_cast<Instruction>(Val);
-    if (!I)
-      return false;
-    // TODO: Handle triangular loops.
-    // e.g. for(int i=0;i<N;i++)
-    //        for(int j=i;j<N;j++)
-    unsigned IncomBlockIndx = PHINode::getIncomingValueNumForOperand(i);
-    if (InnerInduction->getIncomingBlock(IncomBlockIndx) ==
-            InnerLoopPreheader &&
-        !OuterLoop->isLoopInvariant(I)) {
-      return false;
+  for (PHINode *InnerInduction : InnerLoopInductions) {
+    unsigned Num = InnerInduction->getNumOperands();
+    for (unsigned i = 0; i < Num; ++i) {
+      Value *Val = InnerInduction->getOperand(i);
+      if (isa<Constant>(Val))
+        continue;
+      Instruction *I = dyn_cast<Instruction>(Val);
+      if (!I)
+        return false;
+      // TODO: Handle triangular loops.
+      // e.g. for(int i=0;i<N;i++)
+      //        for(int j=i;j<N;j++)
+      unsigned IncomBlockIndx = PHINode::getIncomingValueNumForOperand(i);
+      if (InnerInduction->getIncomingBlock(IncomBlockIndx) ==
+              InnerLoopPreheader &&
+          !OuterLoop->isLoopInvariant(I)) {
+        return false;
+      }
     }
   }
 
@@ -683,12 +691,12 @@
     // InnerInduction, or a binary operator that involves
     // InnerInduction and a constant.
     std::function<bool(Value *)> IsPathToIndVar;
-    IsPathToIndVar = [&InnerInduction, &IsPathToIndVar](Value *V) -> bool {
-      if (V == InnerInduction)
+    IsPathToIndVar = [this, &IsPathToIndVar](const Value *V) -> bool {
+      if (llvm::is_contained(InnerLoopInductions, V))
         return true;
       if (isa<Constant>(V))
         return true;
-      Instruction *I = dyn_cast<Instruction>(V);
+      const Instruction *I = dyn_cast<Instruction>(V);
       if (!I)
         return false;
       if (isa<CastInst>(I))
@@ -699,6 +707,13 @@
       return false;
     };
 
+    // In case of multiple inner loop indvars, it is okay if LHS and RHS
+    // are both inner indvar related variables.
+    if (IsPathToIndVar(Op0) && IsPathToIndVar(Op1))
+      return true;
+
+    // Otherwise we check if the cmp instruction compares an inner indvar
+    // related variable (Left) with a outer loop invariant (Right).
     if (IsPathToIndVar(Op0) && !isa<Constant>(Op0)) {
       Left = Op0;
       Right = Op1;
@@ -815,7 +830,6 @@
     return true;
   }
 
-  PHINode *InnerInductionVar;
   SmallVector<PHINode *, 8> Inductions;
   if (!findInductionAndReductions(OuterLoop, Inductions, InnerLoop)) {
     LLVM_DEBUG(
@@ -859,25 +873,11 @@
     });
     return true;
   }
-
-  // TODO: Currently we handle only loops with 1 induction variable.
-  if (Inductions.size() != 1) {
-    LLVM_DEBUG(
-        dbgs() << "We currently only support loops with 1 induction variable."
-               << "Failed to interchange due to current limitation\n");
-    ORE->emit([&]() {
-      return OptimizationRemarkMissed(DEBUG_TYPE, "MultiInductionInner",
-                                      InnerLoop->getStartLoc(),
-                                      InnerLoop->getHeader())
-             << "Only inner loops with 1 induction variable can be "
-                "interchanged currently.";
-    });
-    return true;
-  }
-  InnerInductionVar = Inductions.pop_back_val();
+  // Copy over to the set of inner loop indvars which will be used later.
+  InnerLoopInductions = Inductions;
 
   // TODO: Triangular loops are not handled for now.
-  if (!isLoopStructureUnderstood(InnerInductionVar)) {
+  if (!isLoopStructureUnderstood()) {
     LLVM_DEBUG(dbgs() << "Loop structure not understood by pass\n");
     ORE->emit([&]() {
       return OptimizationRemarkMissed(DEBUG_TYPE, "UnsupportedStructureInner",
@@ -888,78 +888,6 @@
     return true;
   }
 
-  // TODO: Current limitation: Since we split the inner loop latch at the point
-  // were induction variable is incremented (induction.next); We cannot have
-  // more than 1 user of induction.next since it would result in broken code
-  // after split.
-  // e.g.
-  // for(i=0;i<N;i++) {
-  //    for(j = 0;j<M;j++) {
-  //      A[j+1][i+2] = A[j][i]+k;
-  //  }
-  // }
-  Instruction *InnerIndexVarInc = nullptr;
-  if (InnerInductionVar->getIncomingBlock(0) == InnerLoopPreHeader)
-    InnerIndexVarInc =
-        dyn_cast<Instruction>(InnerInductionVar->getIncomingValue(1));
-  else
-    InnerIndexVarInc =
-        dyn_cast<Instruction>(InnerInductionVar->getIncomingValue(0));
-
-  if (!InnerIndexVarInc) {
-    LLVM_DEBUG(
-        dbgs() << "Did not find an instruction to increment the induction "
-               << "variable.\n");
-    ORE->emit([&]() {
-      return OptimizationRemarkMissed(DEBUG_TYPE, "NoIncrementInInner",
-                                      InnerLoop->getStartLoc(),
-                                      InnerLoop->getHeader())
-             << "The inner loop does not increment the induction variable.";
-    });
-    return true;
-  }
-
-  // Since we split the inner loop latch on this induction variable. Make sure
-  // we do not have any instruction between the induction variable and branch
-  // instruction.
-
-  bool FoundInduction = false;
-  for (const Instruction &I :
-       llvm::reverse(InnerLoopLatch->instructionsWithoutDebug())) {
-    if (isa<BranchInst>(I) || isa<CmpInst>(I) || isa<TruncInst>(I) ||
-        isa<ZExtInst>(I))
-      continue;
-
-    // We found an instruction. If this is not induction variable then it is not
-    // safe to split this loop latch.
-    if (!I.isIdenticalTo(InnerIndexVarInc)) {
-      LLVM_DEBUG(dbgs() << "Found unsupported instructions between induction "
-                        << "variable increment and branch.\n");
-      ORE->emit([&]() {
-        return OptimizationRemarkMissed(
-                   DEBUG_TYPE, "UnsupportedInsBetweenInduction",
-                   InnerLoop->getStartLoc(), InnerLoop->getHeader())
-               << "Found unsupported instruction between induction variable "
-                  "increment and branch.";
-      });
-      return true;
-    }
-
-    FoundInduction = true;
-    break;
-  }
-  // The loop latch ended and we didn't find the induction variable return as
-  // current limitation.
-  if (!FoundInduction) {
-    LLVM_DEBUG(dbgs() << "Did not find the induction variable.\n");
-    ORE->emit([&]() {
-      return OptimizationRemarkMissed(DEBUG_TYPE, "NoIndutionVariable",
-                                      InnerLoop->getStartLoc(),
-                                      InnerLoop->getHeader())
-             << "Did not find the induction variable.";
-    });
-    return true;
-  }
   return false;
 }
 
@@ -1347,25 +1275,25 @@
 
 bool LoopInterchangeTransform::transform() {
   bool Transformed = false;
-  Instruction *InnerIndexVar;
 
   if (InnerLoop->getSubLoops().empty()) {
     BasicBlock *InnerLoopPreHeader = InnerLoop->getLoopPreheader();
     LLVM_DEBUG(dbgs() << "Splitting the inner loop latch\n");
-    PHINode *InductionPHI = getInductionVariable(InnerLoop, SE);
-    if (!InductionPHI) {
+    auto &InductionPHIs = LIL.getInnerLoopInductions();
+    if (InductionPHIs.empty()) {
       LLVM_DEBUG(dbgs() << "Failed to find the point to split loop latch \n");
       return false;
     }
 
-    if (InductionPHI->getIncomingBlock(0) == InnerLoopPreHeader)
-      InnerIndexVar = dyn_cast<Instruction>(InductionPHI->getIncomingValue(1));
-    else
-      InnerIndexVar = dyn_cast<Instruction>(InductionPHI->getIncomingValue(0));
-
-    // Ensure that InductionPHI is the first Phi node.
-    if (&InductionPHI->getParent()->front() != InductionPHI)
-      InductionPHI->moveBefore(&InductionPHI->getParent()->front());
+    SmallVector<Instruction *, 8> InnerIndexVarList;
+    for (PHINode *CurInductionPHI : InductionPHIs) {
+      if (CurInductionPHI->getIncomingBlock(0) == InnerLoopPreHeader)
+        InnerIndexVarList.push_back(
+            dyn_cast<Instruction>(CurInductionPHI->getIncomingValue(1)));
+      else
+        InnerIndexVarList.push_back(
+            dyn_cast<Instruction>(CurInductionPHI->getIncomingValue(0)));
+    }
 
     // Create a new latch block for the inner loop. We split at the
     // current latch's terminator and then move the condition and all
@@ -1377,7 +1305,7 @@
 
     SmallSetVector<Instruction *, 4> WorkList;
     unsigned i = 0;
-    auto MoveInstructions = [&i, &WorkList, this, InductionPHI, NewLatch]() {
+    auto MoveInstructions = [&i, &WorkList, this, &InductionPHIs, NewLatch]() {
       for (; i < WorkList.size(); i++) {
         // Duplicate instruction and move it the new latch. Update uses that
         // have been moved.
@@ -1389,7 +1317,8 @@
         for (Use &U : llvm::make_early_inc_range(WorkList[i]->uses())) {
           Instruction *UserI = cast<Instruction>(U.getUser());
           if (!InnerLoop->contains(UserI->getParent()) ||
-              UserI->getParent() == NewLatch || UserI == InductionPHI)
+              UserI->getParent() == NewLatch ||
+              llvm::is_contained(InductionPHIs, UserI))
             U.set(NewI);
         }
         // Add operands of moved instruction to the worklist, except if they are
@@ -1398,7 +1327,7 @@
           Instruction *OpI = dyn_cast<Instruction>(Op);
           if (!OpI ||
               this->LI->getLoopFor(OpI->getParent()) != this->InnerLoop ||
-              OpI == InductionPHI)
+              llvm::is_contained(InductionPHIs, OpI))
             continue;
           WorkList.insert(OpI);
         }
@@ -1412,7 +1341,8 @@
     if (CondI)
       WorkList.insert(CondI);
     MoveInstructions();
-    WorkList.insert(cast<Instruction>(InnerIndexVar));
+    for (Instruction *InnerIndexVar : InnerIndexVarList)
+      WorkList.insert(cast<Instruction>(InnerIndexVar));
     MoveInstructions();
 
     // Splits the inner loops phi nodes out into a separate basic block.
@@ -1685,7 +1615,6 @@
   updateSuccessor(InnerLoopLatchPredecessorBI, InnerLoopLatch,
                   InnerLoopLatchSuccessor, DTUpdates);
 
-
   if (OuterLoopLatchBI->getSuccessor(0) == OuterLoopHeader)
     OuterLoopLatchSuccessor = OuterLoopLatchBI->getSuccessor(1);
   else
@@ -1712,7 +1641,8 @@
   SmallVector<PHINode *, 4> InnerLoopPHIs, OuterLoopPHIs;
   for (PHINode &PHI : InnerLoopHeader->phis())
     if (OuterInnerReductions.contains(&PHI))
-      InnerLoopPHIs.push_back(cast<PHINode>(&PHI));
+      InnerLoopPHIs.push_back(&PHI);
+
   for (PHINode &PHI : OuterLoopHeader->phis())
     if (OuterInnerReductions.contains(&PHI))
       OuterLoopPHIs.push_back(cast<PHINode>(&PHI));
@@ -1725,6 +1655,7 @@
     assert(OuterInnerReductions.count(PHI) && "Expected a reduction PHI node");
   }
   for (PHINode *PHI : InnerLoopPHIs) {
+    LLVM_DEBUG(dbgs() << "Inner loop reduction PHIs:\n"; PHI->dump(););
     PHI->moveBefore(OuterLoopHeader->getFirstNonPHI());
     assert(OuterInnerReductions.count(PHI) && "Expected a reduction PHI node");
   }
diff --git a/llvm/test/Transforms/LoopInterchange/interchangeable-innerloop-multiple-indvars.ll b/llvm/test/Transforms/LoopInterchange/interchangeable-innerloop-multiple-indvars.ll
new file mode 100644
--- /dev/null
+++ b/llvm/test/Transforms/LoopInterchange/interchangeable-innerloop-multiple-indvars.ll
@@ -0,0 +1,283 @@
+; RUN: opt < %s -basic-aa -loop-interchange -verify-dom-info -verify-loop-info -verify-scev -verify-loop-lcssa -S | FileCheck %s
+
+@c = common dso_local local_unnamed_addr global i32 0, align 4
+@d = common dso_local local_unnamed_addr global i32 0, align 4
+@e = common dso_local local_unnamed_addr global i32 0, align 4
+@b = common dso_local local_unnamed_addr global [200 x [200 x i32]] zeroinitializer, align 4
+@a = common dso_local local_unnamed_addr global i32 0, align 4
+
+;; int a, c, d, e;
+;; int b[200][200];
+;; void fn1() {
+;;   for (; c; c++) {
+;;     d = 5;
+;;     e = 5;
+;;     for (; d, e; d--, e--)
+;;       a |= b[d][c + 9];
+;;   }
+;; }
+;
+; There are multiple inner loop indvars and only one 
+; of them is used in the loop exit condition at the
+; inner loop latch.
+;
+define void @test1() {
+; CHECK-LABEL: @test1(
+; CHECK:    for.body:
+; CHECK:    [[INDVARS_IV16:%.*]] = phi i64 [ [[TMP1:%.*]], [[FOR_BODY_LR_PH:%.*]] ], [ [[INDVARS_IV_NEXT17:%.*]], [[FOR_INC7:%.*]] ]
+; CHECK:    [[OR12:%.*]] = phi i32 [ [[OR:%.*]], [[FOR_INC7]] ], [ [[OR_LCSSA15:%.*]], [[FOR_BODY_LR_PH]] ]
+; CHECK:    for.body3:
+; CHECK:    [[INDVARS_IV:%.*]] = phi i64 [ [[TMP6:%.*]], [[FOR_BODY3_SPLIT:%.*]] ], [ 5, [[FOR_BODY3_PREHEADER:%.*]] ]
+; CHECK:    [[DEC11:%.*]] = phi i32 [ [[TMP7:%.*]], [[FOR_BODY3_SPLIT]] ], [ 5, [[FOR_BODY3_PREHEADER]] ]
+; CHECK:    [[OR_LCSSA15]] = phi i32 [ [[A_PROMOTED14:%.*]], [[FOR_BODY3_PREHEADER]] ], [ [[OR_LCSSA:%.*]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.body3.split:
+; CHECK:    [[OR_LCSSA]] = phi i32 [ [[OR]], [[FOR_INC7]] ]
+; CHECK:    [[TMP7]] = add nsw i32 [[DEC11]], -1
+; CHECK:    [[TMP8:%.*]] = icmp eq i32 [[TMP7]], 0
+; CHECK:    for.inc7:
+; CHECK:    [[INDVARS_IV_NEXT17]] = add nsw i64 [[INDVARS_IV16]], 1
+; CHECK:    for.cond.for.end8_crit_edge:
+; CHECK:    [[OR_LCSSA_LCSSA:%.*]] = phi i32 [ [[OR_LCSSA]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.end8:
+; CHECK:    ret void
+;
+entry:
+  %.pr = load i32, i32* @c, align 4
+  %tobool10 = icmp eq i32 %.pr, 0
+  br i1 %tobool10, label %for.end8, label %for.body.lr.ph
+
+for.body.lr.ph:                                   ; preds = %entry
+  %a.promoted14 = load i32, i32* @a, align 4
+  %0 = sext i32 %.pr to i64
+  %1 = sub i32 -1, %.pr
+  %2 = zext i32 %1 to i64
+  %3 = add i64 %0, %2
+  br label %for.body
+
+for.body:                                         ; preds = %for.body.lr.ph, %for.inc7
+  %indvars.iv16 = phi i64 [ %0, %for.body.lr.ph ], [ %indvars.iv.next17, %for.inc7 ]
+  %or.lcssa15 = phi i32 [ %a.promoted14, %for.body.lr.ph ], [ %or.lcssa, %for.inc7 ]
+  %4 = add nsw i64 %indvars.iv16, 9
+  br label %for.body3
+
+for.body3:                                        ; preds = %for.body, %for.body3
+  %or12 = phi i32 [ %or.lcssa15, %for.body ], [ %or, %for.body3 ]
+  %indvars.iv = phi i64 [ 5, %for.body ], [ %indvars.iv.next, %for.body3 ]
+  %dec11 = phi i32 [ 5, %for.body ], [ %dec, %for.body3 ]
+  %arrayidx5 = getelementptr inbounds [200 x [200 x i32]], [200 x [200 x i32]]* @b, i64 0, i64 %indvars.iv, i64 %4
+  %5 = load i32, i32* %arrayidx5, align 4
+  %or = or i32 %or12, %5  
+  %indvars.iv.next = add nsw i64 %indvars.iv, -1
+  %dec = add nsw i32 %dec11, -1
+  %tobool2 = icmp eq i32 %dec, 0
+  br i1 %tobool2, label %for.inc7, label %for.body3
+
+for.inc7:                                         ; preds = %for.body3
+  %or.lcssa = phi i32 [ %or, %for.body3 ]
+  %indvars.iv.next17 = add nsw i64 %indvars.iv16, 1
+  %6 = trunc i64 %indvars.iv.next17 to i32
+  %tobool = icmp eq i32 %6, 0
+  br i1 %tobool, label %for.cond.for.end8_crit_edge, label %for.body
+
+for.cond.for.end8_crit_edge:                      ; preds = %for.inc7
+  %or.lcssa.lcssa = phi i32 [ %or.lcssa, %for.inc7 ]
+  %dec6.lcssa.lcssa = phi i32 [ 0, %for.inc7 ]
+  %7 = add i64 %3, 1
+  %8 = trunc i64 %7 to i32
+  store i32 0, i32* @d, align 4
+  store i32 %dec6.lcssa.lcssa, i32* @e, align 4
+  store i32 %or.lcssa.lcssa, i32* @a, align 4
+  store i32 %8, i32* @c, align 4
+  br label %for.end8
+
+for.end8:                                         ; preds = %for.cond.for.end8_crit_edge, %entry
+  ret void
+}
+
+;; int a, c, d, e;
+;; int b[200][200];
+;; void fn1() {
+;;   for (; c; c++) {
+;;     d = 5;
+;;     e = 6;
+;;     for (; d+e>0; d--, e=e-2)
+;;       a |= b[d][c + 9];
+;;   }
+;; }
+;
+; All inner loop indvars are used in the inner latch.
+;
+define void @test2() {
+; CHECK-LABEL: @test2(
+; CHECK:    for.body:
+; CHECK:    [[INDVARS_IV16:%.*]] = phi i64 [ [[TMP1:%.*]], [[FOR_BODY_LR_PH:%.*]] ], [ [[INDVARS_IV_NEXT17:%.*]], [[FOR_INC7:%.*]] ]
+; CHECK:    [[OR12:%.*]] = phi i32 [ [[OR:%.*]], [[FOR_INC7]] ], [ [[OR_LCSSA15:%.*]], [[FOR_BODY_LR_PH]] ]
+; CHECK:    [[TMP0:%.*]] = add nsw i64 [[INDVARS_IV16]], 9
+; CHECK:    for.body3:
+; CHECK:    [[INDVARS_IV:%.*]] = phi i64 [ [[TMP7:%.*]], [[FOR_BODY3_SPLIT:%.*]] ], [ 5, [[FOR_BODY3_PREHEADER]] ]
+; CHECK:    [[DEC11:%.*]] = phi i32 [ [[TMP6:%.*]], [[FOR_BODY3_SPLIT]] ], [ 6, [[FOR_BODY3_PREHEADER]] ]
+; CHECK:    [[OR_LCSSA15]] = phi i32 [ [[A_PROMOTED14]], [[FOR_BODY3_PREHEADER]] ], [ [[OR_LCSSA:%.*]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.body3.split1:
+; CHECK:    [[ARRAYIDX5:%.*]] = getelementptr inbounds [200 x [200 x i32]], [200 x [200 x i32]]* @b, i64 0, i64 [[INDVARS_IV]], i64 [[TMP0]]
+; CHECK:    [[TMP5:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4
+; CHECK:    [[OR]] = or i32 [[OR12]], [[TMP5]]
+; CHECK:    for.body3.split:
+; CHECK:    [[OR_LCSSA]] = phi i32 [ [[OR]], [[FOR_INC7]] ]
+; CHECK:    [[TMP6]] = add nsw i32 [[DEC11]], -2
+; CHECK:    [[TMP7:%.*]] = sext i32 [[TMP6]] to i64
+; CHECK:    [[TMP8]] = add nsw i64 [[INDVARS_IV]], -1
+; CHECK:    [[TMP9:%.*]] = add nsw i64 [[TMP8]], [[TMP7]]
+; CHECK:    [[TMP10:%.*]] = icmp eq i64 [[TMP9]], 0
+; CHECK:    for.inc7:
+; CHECK:    [[INDVARS_IV_NEXT17]] = add nsw i64 [[INDVARS_IV16]], 1
+; CHECK:    for.cond.for.end8_crit_edge:
+; CHECK:    [[OR_LCSSA_LCSSA:%.*]] = phi i32 [ [[OR_LCSSA]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.end8:
+; CHECK:    ret void
+;
+entry:
+  %.pr = load i32, i32* @c, align 4
+  %tobool10 = icmp eq i32 %.pr, 0
+  br i1 %tobool10, label %for.end8, label %for.body.lr.ph
+
+for.body.lr.ph:                                   ; preds = %entry
+  %a.promoted14 = load i32, i32* @a, align 4
+  %0 = sext i32 %.pr to i64
+  %1 = sub i32 -1, %.pr
+  %2 = zext i32 %1 to i64
+  %3 = add i64 %0, %2
+  br label %for.body
+
+for.body:                                         ; preds = %for.body.lr.ph, %for.inc7
+  %indvars.iv16 = phi i64 [ %0, %for.body.lr.ph ], [ %indvars.iv.next17, %for.inc7 ]
+  %or.lcssa15 = phi i32 [ %a.promoted14, %for.body.lr.ph ], [ %or.lcssa, %for.inc7 ]
+  %4 = add nsw i64 %indvars.iv16, 9
+  br label %for.body3
+
+for.body3:                                        ; preds = %for.body, %for.body3
+  %or12 = phi i32 [ %or.lcssa15, %for.body ], [ %or, %for.body3 ]
+  %indvars.iv = phi i64 [ 5, %for.body ], [ %indvars.iv.next, %for.body3 ]
+  %dec11 = phi i32 [ 6, %for.body ], [ %dec, %for.body3 ]
+  %arrayidx5 = getelementptr inbounds [200 x [200 x i32]], [200 x [200 x i32]]* @b, i64 0, i64 %indvars.iv, i64 %4
+  %5 = load i32, i32* %arrayidx5, align 4
+  %or = or i32 %or12, %5
+  %indvars.iv.next = add nsw i64 %indvars.iv, -1
+  %dec = add nsw i32 %dec11, -2    
+  %dec.ext = sext i32 %dec to i64
+  %indvars.add = add nsw i64 %indvars.iv.next, %dec.ext
+  %tobool2 = icmp eq i64 %indvars.add, 0
+  br i1 %tobool2, label %for.inc7, label %for.body3
+
+for.inc7:                                         ; preds = %for.body3
+  %or.lcssa = phi i32 [ %or, %for.body3 ]
+  %indvars.iv.next17 = add nsw i64 %indvars.iv16, 1
+  %6 = trunc i64 %indvars.iv.next17 to i32
+  %tobool = icmp eq i32 %6, 0
+  br i1 %tobool, label %for.cond.for.end8_crit_edge, label %for.body
+
+for.cond.for.end8_crit_edge:                      ; preds = %for.inc7
+  %or.lcssa.lcssa = phi i32 [ %or.lcssa, %for.inc7 ]
+  %dec6.lcssa.lcssa = phi i32 [ 0, %for.inc7 ]
+  %7 = add i64 %3, 1
+  %8 = trunc i64 %7 to i32
+  store i32 0, i32* @d, align 4
+  store i32 %dec6.lcssa.lcssa, i32* @e, align 4
+  store i32 %or.lcssa.lcssa, i32* @a, align 4
+  store i32 %8, i32* @c, align 4
+  br label %for.end8
+
+for.end8:                                         ; preds = %for.cond.for.end8_crit_edge, %entry
+  ret void
+}
+
+;; int a, c, d, e;
+;; int b[200][200];
+;; void fn1() {
+;;   for (; c; c++) {
+;;     d = 5;
+;;     e = 49;
+;;     for (; d != e; d++, e--)
+;;       a |= b[d][c + 9];
+;;   }
+;; }
+;
+; Two inner loop indvars are involved in the inner loop exit
+; condition as LHS and RHS.
+define void @test3() {
+; CHECK-LABEL: @test3(
+; CHECK:    for.body:
+; CHECK:    [[INDVARS_IV16:%.*]] = phi i64 [ [[TMP1:%.*]], [[FOR_BODY_LR_PH:%.*]] ], [ [[INDVARS_IV_NEXT17:%.*]], [[FOR_INC7:%.*]] ]
+; CHECK:    [[OR12:%.*]] = phi i32 [ [[OR:%.*]], [[FOR_INC7]] ], [ [[OR_LCSSA15:%.*]], [[FOR_BODY_LR_PH]] ]
+; CHECK:    [[TMP0:%.*]] = add nsw i64 [[INDVARS_IV16]], 9
+; CHECK:    for.body3:
+; CHECK:    [[INDVARS_IV:%.*]] = phi i32 [ [[TMP7:%.*]], [[FOR_BODY3_SPLIT:%.*]] ], [ 5, [[FOR_BODY3_PREHEADER]] ]
+; CHECK:    [[DEC11:%.*]] = phi i32 [ [[TMP6:%.*]], [[FOR_BODY3_SPLIT]] ], [ 49, [[FOR_BODY3_PREHEADER]] ]
+; CHECK:    [[OR_LCSSA15]] = phi i32 [ [[A_PROMOTED14]], [[FOR_BODY3_PREHEADER]] ], [ [[OR_LCSSA:%.*]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.body3.split1:
+; CHECK:    [[ARRAYIDX5:%.*]] = getelementptr inbounds [200 x [200 x i32]], [200 x [200 x i32]]* @b, i64 0, i32 [[INDVARS_IV]], i64 [[TMP0]]
+; CHECK:    [[TMP5:%.*]] = load i32, i32* [[ARRAYIDX5]], align 4
+; CHECK:    [[OR]] = or i32 [[OR12]], [[TMP5]]
+; CHECK:    for.body3.split:
+; CHECK:    [[OR_LCSSA]] = phi i32 [ [[OR]], [[FOR_INC7]] ]
+; CHECK:    [[TMP6]] = add nsw i32 [[DEC11]], -1
+; CHECK:    [[TMP7]] = add nsw i32 [[INDVARS_IV]], 1
+; CHECK:    [[TMP8:%.*]] = icmp eq i32 [[TMP7]], [[TMP6]]
+; CHECK:    for.inc7:
+; CHECK:    [[INDVARS_IV_NEXT17]] = add nsw i64 [[INDVARS_IV16]], 1
+; CHECK:    for.cond.for.end8_crit_edge:
+; CHECK:    [[OR_LCSSA_LCSSA:%.*]] = phi i32 [ [[OR_LCSSA]], [[FOR_BODY3_SPLIT]] ]
+; CHECK:    for.end8:
+; CHECK:    ret void
+;
+entry:
+  %.pr = load i32, i32* @c, align 4
+  %tobool10 = icmp eq i32 %.pr, 0
+  br i1 %tobool10, label %for.end8, label %for.body.lr.ph
+
+for.body.lr.ph:                                   ; preds = %entry
+  %a.promoted14 = load i32, i32* @a, align 4
+  %0 = sext i32 %.pr to i64
+  %1 = sub i32 -1, %.pr
+  %2 = zext i32 %1 to i64
+  %3 = add i64 %0, %2
+  br label %for.body
+
+for.body:                                         ; preds = %for.body.lr.ph, %for.inc7
+  %indvars.iv16 = phi i64 [ %0, %for.body.lr.ph ], [ %indvars.iv.next17, %for.inc7 ]
+  %or.lcssa15 = phi i32 [ %a.promoted14, %for.body.lr.ph ], [ %or.lcssa, %for.inc7 ]
+  %4 = add nsw i64 %indvars.iv16, 9
+  br label %for.body3
+
+for.body3:                                        ; preds = %for.body, %for.body3
+  %or12 = phi i32 [ %or.lcssa15, %for.body ], [ %or, %for.body3 ]
+  %indvars.iv = phi i32 [ 5, %for.body ], [ %indvars.iv.next, %for.body3 ]
+  %dec11 = phi i32 [ 49, %for.body ], [ %dec, %for.body3 ]
+  %arrayidx5 = getelementptr inbounds [200 x [200 x i32]], [200 x [200 x i32]]* @b, i64 0, i32 %indvars.iv, i64 %4
+  %5 = load i32, i32* %arrayidx5, align 4
+  %or = or i32 %or12, %5
+  %indvars.iv.next = add nsw i32 %indvars.iv, 1
+  %dec = add nsw i32 %dec11, -1
+  %tobool2 = icmp eq i32 %indvars.iv.next, %dec
+  br i1 %tobool2, label %for.inc7, label %for.body3
+
+for.inc7:                                         ; preds = %for.body3
+  %or.lcssa = phi i32 [ %or, %for.body3 ]
+  %indvars.iv.next17 = add nsw i64 %indvars.iv16, 1
+  %6 = trunc i64 %indvars.iv.next17 to i32
+  %tobool = icmp eq i32 %6, 0
+  br i1 %tobool, label %for.cond.for.end8_crit_edge, label %for.body
+
+for.cond.for.end8_crit_edge:                      ; preds = %for.inc7
+  %or.lcssa.lcssa = phi i32 [ %or.lcssa, %for.inc7 ]
+  %dec6.lcssa.lcssa = phi i32 [ 0, %for.inc7 ]
+  %7 = add i64 %3, 1
+  %8 = trunc i64 %7 to i32
+  store i32 0, i32* @d, align 4
+  store i32 %dec6.lcssa.lcssa, i32* @e, align 4
+  store i32 %or.lcssa.lcssa, i32* @a, align 4
+  store i32 %8, i32* @c, align 4
+  br label %for.end8
+
+for.end8:                                         ; preds = %for.cond.for.end8_crit_edge, %entry
+  ret void
+}
\ No newline at end of file