Index: lib/Analysis/InlineCost.cpp =================================================================== --- lib/Analysis/InlineCost.cpp +++ lib/Analysis/InlineCost.cpp @@ -206,6 +206,8 @@ bool visitCastInst(CastInst &I); bool visitUnaryInstruction(UnaryInstruction &I); bool visitCmpInst(CmpInst &I); + bool visitAnd(BinaryOperator &I); + bool visitOr(BinaryOperator &I); bool visitSub(BinaryOperator &I); bool visitBinaryOperator(BinaryOperator &I); bool visitLoad(LoadInst &I); @@ -784,6 +786,42 @@ return false; } +bool CallAnalyzer::visitOr(BinaryOperator &I) { + // See if we can simplify a logical 'or'. If either operand simplifies to + // true, the 'or' simplifies to true. This is necessary because the generic + // simplify instruction only works if both operands are constants. + if (I.getType()->isIntegerTy(1)) { + for (unsigned i = 0; i < 2; ++i) { + Value *Op = I.getOperand(i); + if (ConstantInt *C = + dyn_cast_or_null(SimplifiedValues.lookup(Op))) + if (C->isOne()) { + SimplifiedValues[&I] = C; + return true; + } + } + } + return Base::visitOr(I); +} + +bool CallAnalyzer::visitAnd(BinaryOperator &I) { + // See if we can simplify a logical 'and'. If either operand simplifies to + // false, the 'and' simplifies to false. This is necessary because the + // generic simplify instruction only works if both operands are constants. + if (I.getType()->isIntegerTy(1)) { + for (unsigned i = 0; i < 2; ++i) { + Value *Op = I.getOperand(i); + if (ConstantInt *C = + dyn_cast_or_null(SimplifiedValues.lookup(Op))) + if (C->isZero()) { + SimplifiedValues[&I] = C; + return true; + } + } + } + return Base::visitAnd(I); +} + bool CallAnalyzer::visitSub(BinaryOperator &I) { // Try to handle a special case: we can fold computing the difference of two // constant-related pointers. Index: test/Transforms/Inline/AArch64/logical-and-or.ll =================================================================== --- /dev/null +++ test/Transforms/Inline/AArch64/logical-and-or.ll @@ -0,0 +1,66 @@ +; REQUIRES: asserts +; RUN: opt -inline -mtriple=aarch64--linux-gnu -S -debug-only=inline-cost < %s 2>&1 | FileCheck %s + +target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128" +target triple = "aarch64--linux-gnu" + +; FIXME: Once the 'or' or 'and' is simplified the second compare is dead, but +; the inline cost model has already added the cost. + +define i1 @outer1(i32 %a) { + %C = call i1 @inner1(i32 0, i32 %a) + ret i1 %C +} + +; CHECK: Analyzing call of inner1 +; CHECK: NumInstructionsSimplified: 3 +; CHECK: NumInstructions: 4 +define i1 @inner1(i32 %a, i32 %b) { + %tobool = icmp eq i32 %a, 0 ; Simplifies to true + %tobool1 = icmp eq i32 %b, 0 ; Should be dead once 'or' is simplified + %or.cond = or i1 %tobool, %tobool1 ; Simplifies to true + ret i1 %or.cond ; Simplifies to ret i1 true +} + +define i1 @outer2(i32 %a) { + %C = call i1 @inner2(i32 1, i32 %a) + ret i1 %C +} + +; CHECK: Analyzing call of inner2 +; CHECK: NumInstructionsSimplified: 3 +; CHECK: NumInstructions: 4 +define i1 @inner2(i32 %a, i32 %b) { + %tobool = icmp eq i32 %a, 0 ; Simplifies to false + %tobool1 = icmp eq i32 %b, 0 ; Should be dead once 'and' is simplified + %and.cond = and i1 %tobool, %tobool1 ; Simplifies to false + ret i1 %and.cond ; Simplifies to ret i1 false +} + +define i1 @outer3(i32 %a) { + %C = call i1 @inner3(i32 0, i32 %a) + ret i1 %C +} + +; CHECK: Analyzing call of inner3 +; CHECK: NumInstructionsSimplified: 3 +; CHECK: NumInstructions: 4 +define i1 @inner3(i32 %a, i32 %b) { + %tobool = icmp eq i32 %a, 0 ; Simplifies to true + %tobool1 = icmp eq i32 %b, 0 ; Should be dead once 'or' is simplified + %or.cond = or i1 %tobool, %tobool1 ; Simplifies to true + br i1 %or.cond, label %end, label %isfalse ; Simplifies to br label %end + +isfalse: ; This block is unreachable once inlined + call void @dead() + call void @dead() + call void @dead() + call void @dead() + call void @dead() + br label %end + +end: + ret i1 %or.cond ; Simplifies to ret i1 true +} + +declare void @dead()