Index: lib/Target/PowerPC/PPC.h =================================================================== --- lib/Target/PowerPC/PPC.h +++ lib/Target/PowerPC/PPC.h @@ -44,7 +44,7 @@ FunctionPass *createPPCQPXLoadSplatPass(); FunctionPass *createPPCISelDag(PPCTargetMachine &TM); FunctionPass *createPPCTLSDynamicCallPass(); - FunctionPass *createPPCBoolRetToIntPass(); + FunctionPass *createPPCBoolRetToIntPass(PPCTargetMachine &TM); FunctionPass *createPPCExpandISELPass(); void LowerPPCMachineInstrToMCInst(const MachineInstr *MI, MCInst &OutMI, AsmPrinter &AP, bool isDarwin); Index: lib/Target/PowerPC/PPCBoolRetToInt.cpp =================================================================== --- lib/Target/PowerPC/PPCBoolRetToInt.cpp +++ lib/Target/PowerPC/PPCBoolRetToInt.cpp @@ -33,6 +33,7 @@ //===----------------------------------------------------------------------===// #include "PPC.h" +#include "PPCTargetMachine.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/SmallPtrSet.h" #include "llvm/ADT/SmallVector.h" @@ -88,16 +89,19 @@ } // Translate a i1 value to an equivalent i32 value: - static Value *translate(Value *V) { - Type *Int32Ty = Type::getInt32Ty(V->getContext()); + Value *translate(Value *V) { + Type *IntTy = Type::getInt32Ty(V->getContext()); + if (ST && ST->isPPC64()) + IntTy = Type::getInt64Ty(V->getContext()); + if (auto *C = dyn_cast(V)) - return ConstantExpr::getZExt(C, Int32Ty); + return ConstantExpr::getZExt(C, IntTy); if (auto *P = dyn_cast(V)) { // Temporarily set the operands to 0. We'll fix this later in // runOnUse. - Value *Zero = Constant::getNullValue(Int32Ty); + Value *Zero = Constant::getNullValue(IntTy); PHINode *Q = - PHINode::Create(Int32Ty, P->getNumIncomingValues(), P->getName(), P); + PHINode::Create(IntTy, P->getNumIncomingValues(), P->getName(), P); for (unsigned i = 0; i < P->getNumOperands(); ++i) Q->addIncoming(Zero, P->getIncomingBlock(i)); return Q; @@ -109,7 +113,7 @@ auto InstPt = A ? &*A->getParent()->getEntryBlock().begin() : I->getNextNode(); - return new ZExtInst(V, Int32Ty, "", InstPt); + return new ZExtInst(V, IntTy, "", InstPt); } typedef SmallPtrSet PHINodeSet; @@ -177,7 +181,11 @@ public: static char ID; - PPCBoolRetToInt() : FunctionPass(ID) { + PPCBoolRetToInt() : FunctionPass(ID), TM(nullptr) { + initializePPCBoolRetToIntPass(*PassRegistry::getPassRegistry()); + } + + PPCBoolRetToInt(PPCTargetMachine &TM) : FunctionPass(ID), TM(&TM) { initializePPCBoolRetToIntPass(*PassRegistry::getPassRegistry()); } @@ -185,6 +193,10 @@ if (skipFunction(F)) return false; + ST = nullptr; + if (TM) + ST = TM->getSubtargetImpl(F); + PHINodeSet PromotablePHINodes = getPromotablePHINodes(F); B2IMap Bool2IntMap; bool Changed = false; @@ -205,7 +217,7 @@ return Changed; } - static bool runOnUse(Use &U, const PHINodeSet &PromotablePHINodes, + bool runOnUse(Use &U, const PHINodeSet &PromotablePHINodes, B2IMap &BoolToIntMap) { auto Defs = findAllDefs(U); @@ -262,6 +274,10 @@ AU.addPreserved(); FunctionPass::getAnalysisUsage(AU); } + +private: + const PPCSubtarget *ST; + PPCTargetMachine *TM; }; } // end anonymous namespace @@ -271,4 +287,6 @@ "Convert i1 constants to i32 if they are returned", false, false) -FunctionPass *llvm::createPPCBoolRetToIntPass() { return new PPCBoolRetToInt(); } +FunctionPass *llvm::createPPCBoolRetToIntPass(PPCTargetMachine &TM) { + return new PPCBoolRetToInt(TM); +} Index: lib/Target/PowerPC/PPCTargetMachine.cpp =================================================================== --- lib/Target/PowerPC/PPCTargetMachine.cpp +++ lib/Target/PowerPC/PPCTargetMachine.cpp @@ -323,7 +323,7 @@ void PPCPassConfig::addIRPasses() { if (TM->getOptLevel() != CodeGenOpt::None) - addPass(createPPCBoolRetToIntPass()); + addPass(createPPCBoolRetToIntPass(getPPCTargetMachine())); addPass(createAtomicExpandPass(&getPPCTargetMachine())); // For the BG/Q (or if explicitly requested), add explicit data prefetch Index: test/CodeGen/PowerPC/pr32442.ll =================================================================== --- test/CodeGen/PowerPC/pr32442.ll +++ test/CodeGen/PowerPC/pr32442.ll @@ -0,0 +1,18 @@ +; RUN: llc -mtriple=powerpc64le-linux-gnu -mcpu=pwr8 < %s | FileCheck %s + +; CHECK-NOT: clrldi + +define zeroext i1 @foo(i32 signext %i, i32* %p) { +entry: + %cmp = icmp eq i32 %i, 0 + br i1 %cmp, label %return, label %if.end + +if.end: + store i32 %i, i32* %p, align 4 + br label %return + +return: + %retval = phi i1 [ true, %if.end ], [ false, %entry ] + ret i1 %retval +} +