Index: lib/Transforms/Coroutines/CoroEarly.cpp =================================================================== --- lib/Transforms/Coroutines/CoroEarly.cpp +++ lib/Transforms/Coroutines/CoroEarly.cpp @@ -28,7 +28,6 @@ public: Lowerer(Module &M) : LowererBase(M) {} - static std::unique_ptr createIfNeeded(Module &M); bool lowerEarlyIntrinsics(Function &F); }; } @@ -67,15 +66,6 @@ return Changed; } -// This pass has work to do only if we find intrinsics we are going to lower in -// the module. -std::unique_ptr Lowerer::createIfNeeded(Module &M) { - if (declaresIntrinsics(M, {"llvm.coro.resume", "llvm.coro.destroy"})) - return llvm::make_unique(M); - - return {}; -} - //===----------------------------------------------------------------------===// // Top Level Driver //===----------------------------------------------------------------------===// @@ -88,8 +78,11 @@ std::unique_ptr L; + // This pass has work to do only if we find intrinsics we are going to lower + // in the module. bool doInitialization(Module &M) override { - L = Lowerer::createIfNeeded(M); + if (coro::declaresIntrinsics(M, {"llvm.coro.resume", "llvm.coro.destroy"})) + L = llvm::make_unique(M); return false; } @@ -104,7 +97,6 @@ AU.setPreservesCFG(); } }; - } char CoroEarly::ID = 0; Index: lib/Transforms/Coroutines/CoroElide.cpp =================================================================== --- lib/Transforms/Coroutines/CoroElide.cpp +++ lib/Transforms/Coroutines/CoroElide.cpp @@ -13,6 +13,8 @@ #include "CoroInternal.h" #include "llvm/Analysis/AliasAnalysis.h" +#include "llvm/IR/ConstantFolder.h" +#include "llvm/IR/InstIterator.h" #include "llvm/Pass.h" using namespace llvm; @@ -24,16 +26,110 @@ //===----------------------------------------------------------------------===// namespace { - struct CoroElide : FunctionPass { static char ID; CoroElide() : FunctionPass(ID) {} - bool runOnFunction(Function &F) override { return false; } + + bool NeedsToRun = false; + + bool doInitialization(Module &M) override { + NeedsToRun = coro::declaresIntrinsics(M, {"llvm.coro.begin"}); + return false; + } + + bool runOnFunction(Function &F) override; void getAnalysisUsage(AnalysisUsage &AU) const override { - AU.setPreservesAll(); + AU.setPreservesCFG(); } }; +} +// Go through the list of coro.subfn.addr intrinsics and replace them with the +// provided constant. +static void replaceWithConstant(Constant *Value, + SmallVectorImpl &Users) { + if (Users.empty()) + return; + + // See if we need to bitcast the constant to match the type of the intrinsic + // being replaced. Note: All coro.subfn.addr intrinsics return the same type, + // so we only need to examine the type of the first one in the list. + Type *IntrTy = Users.front()->getType(); + Type *ValueTy = Value->getType(); + if (ValueTy != IntrTy) { + // May need to tweak the function type to match the type expected at the + // use site. + assert(ValueTy->isPointerTy() && IntrTy->isPointerTy()); + Value = ConstantExpr::getBitCast(Value, IntrTy); + } + + // Now the value type matches the type of the intrinsic. Go ahead and replace. + for (CoroSubFnInst *I : Users) { + I->replaceAllUsesWith(Value); + I->eraseFromParent(); + } + + // Propagate the constant to turn the indirect call into a direct call, so + // that CGPassManager recognizes the change as devirtualization. + coro::constantFoldUsers(Value); +} + +// See if there are any coro.subfn.addr intrinsics directly referencing +// the coro.begin. If found, replace them with an appropriate coroutine +// subfunction associated with that coro.begin. +static bool replaceIndirectCalls(CoroBeginInst *CoroBegin) { + SmallVector ResumeAddr; + SmallVector DestroyAddr; + + for (User *U : CoroBegin->users()) { + if (auto *II = dyn_cast(U)) { + switch (II->getIndex()) { + case CoroSubFnInst::ResumeIndex: + ResumeAddr.push_back(II); + break; + case CoroSubFnInst::DestroyIndex: + DestroyAddr.push_back(II); + break; + default: + llvm_unreachable("unexpected coro.subfn.addr constant"); + } + } + } + if (ResumeAddr.empty() && DestroyAddr.empty()) + return false; + + // PostSplit coro.begin refers to an array of subfunctions in its Info + // argument. + ConstantArray *Resumers = CoroBegin->getInfo().Resumers; + assert(Resumers && "PostSplit coro.begin Info argument must refer to an array" + "of coroutine subfunctions"); + auto *ResumeAddrConstant = + ConstantFolder().CreateExtractValue(Resumers, CoroSubFnInst::ResumeIndex); + auto *DestroyAddrConstant = ConstantFolder().CreateExtractValue( + Resumers, CoroSubFnInst::DestroyIndex); + + replaceWithConstant(ResumeAddrConstant, ResumeAddr); + replaceWithConstant(DestroyAddrConstant, DestroyAddr); + return true; +} + +bool CoroElide::runOnFunction(Function &F) { + // Collect all PostSplit coro.begins. + SmallVector CoroBegins; + for (auto &I : instructions(F)) + if (auto *CB = dyn_cast(&I)) + if (CB->getInfo().isPostSplit()) + CoroBegins.push_back(CB); + + if (CoroBegins.empty()) + return false; + + bool Changed = false; + + for (auto *CB : CoroBegins) + Changed |= replaceIndirectCalls(CB); + + return Changed; } char CoroElide::ID = 0; Index: lib/Transforms/Coroutines/CoroInstr.h =================================================================== --- lib/Transforms/Coroutines/CoroInstr.h +++ lib/Transforms/Coroutines/CoroInstr.h @@ -61,4 +61,58 @@ } }; +/// This class represents the llvm.coro.begin instruction. +class LLVM_LIBRARY_VISIBILITY CoroBeginInst : public IntrinsicInst { + enum { MemArg, AlignArg, PromiseArg, InfoArg }; + +public: + Constant *getRawInfo() const { + return cast(getArgOperand(InfoArg)->stripPointerCasts()); + } + + void setInfo(Constant *C) { setArgOperand(InfoArg, C); } + + // Info argument of coro.begin is + // fresh out of the front: null ; + // outlined : {Init, Return, Susp1, Susp2, ...} ; + // postsplit : [resume, destroy, cleanup] ; + // + // If parts of the coroutine were outlined to protect against undesirable + // code motion, these functions will be stored in a struct literal referred to + // by the Info parameter. Note: this is only needed before coroutine is split. + // + // After coroutine is split, resume functions are stored in an array constant + // refered by this parameter. + + struct Info { + ConstantStruct *OutlinedParts = nullptr; + ConstantArray *Resumers = nullptr; + + bool hasOutlinedParts() const { return OutlinedParts != nullptr; } + bool isPostSplit() const { return Resumers != nullptr; } + }; + Info getInfo() const { + Info Result; + auto *GV = dyn_cast(getRawInfo()); + if (!GV) + return Result; + + assert(GV->isConstant() && GV->hasDefinitiveInitializer()); + Constant *Initializer = GV->getInitializer(); + if ((Result.OutlinedParts = dyn_cast(Initializer))) + return Result; + + Result.Resumers = cast(Initializer); + return Result; + } + + // Methods for support type inquiry through isa, cast, and dyn_cast: + static inline bool classof(const IntrinsicInst *I) { + return I->getIntrinsicID() == Intrinsic::coro_begin; + } + static inline bool classof(const Value *V) { + return isa(V) && classof(cast(V)); + } +}; + } // End namespace llvm. Index: lib/Transforms/Coroutines/CoroInternal.h =================================================================== --- lib/Transforms/Coroutines/CoroInternal.h +++ lib/Transforms/Coroutines/CoroInternal.h @@ -17,9 +17,6 @@ namespace llvm { -class FunctionType; -class LLVMContext; -class Module; class PassRegistry; void initializeCoroEarlyPass(PassRegistry &); @@ -29,6 +26,9 @@ namespace coro { +void constantFoldUsers(Constant *Value); +bool declaresIntrinsics(Module &M, std::initializer_list); + // Keeps data and helper functions for lowering coroutine intrinsics. struct LowererBase { Module &TheModule; @@ -37,7 +37,6 @@ LowererBase(Module &M); Value *makeSubFnCall(Value *Arg, int Index, Instruction *InsertPt); - static bool declaresIntrinsics(Module &M, std::initializer_list); }; } // End namespace coro. Index: lib/Transforms/Coroutines/Coroutines.cpp =================================================================== --- lib/Transforms/Coroutines/Coroutines.cpp +++ lib/Transforms/Coroutines/Coroutines.cpp @@ -10,6 +10,7 @@ //===----------------------------------------------------------------------===// #include "CoroInternal.h" +#include "llvm/Analysis/ConstantFolding.h" #include "llvm/IR/LegacyPassManager.h" #include "llvm/IR/Verifier.h" #include "llvm/InitializePasses.h" @@ -95,23 +96,48 @@ return Bitcast; } +void coro::constantFoldUsers(Constant *Value) { + SmallPtrSet WorkList; + for (User *U : Value->users()) + WorkList.insert(cast(U)); + + if (WorkList.empty()) + return; + + Instruction *FirstInstr = *WorkList.begin(); + Function *F = FirstInstr->getParent()->getParent(); + const DataLayout &DL = F->getParent()->getDataLayout(); + + do { + Instruction *I = *WorkList.begin(); + WorkList.erase(I); // Get an element from the worklist... + + if (!I->use_empty()) // Don't muck with dead instructions... + if (Constant *C = ConstantFoldInstruction(I, DL)) { + // Add all of the users of this instruction to the worklist, they might + // be constant propagatable now... + for (User *U : I->users()) + WorkList.insert(cast(U)); + + // Replace all of the uses of a variable with uses of the constant. + I->replaceAllUsesWith(C); + + // Remove the dead instruction. + WorkList.erase(I); + I->eraseFromParent(); + } + } while (!WorkList.empty()); +} + #ifndef NDEBUG static bool isCoroutineIntrinsicName(StringRef Name) { // NOTE: Must be sorted! static const char *const CoroIntrinsics[] = { - "llvm.coro.alloc", - "llvm.coro.begin", - "llvm.coro.destroy", - "llvm.coro.done", - "llvm.coro.end", - "llvm.coro.frame", - "llvm.coro.free", - "llvm.coro.param", - "llvm.coro.promise", - "llvm.coro.resume", - "llvm.coro.save", - "llvm.coro.size", - "llvm.coro.suspend", + "llvm.coro.alloc", "llvm.coro.begin", "llvm.coro.destroy", + "llvm.coro.done", "llvm.coro.end", "llvm.coro.frame", + "llvm.coro.free", "llvm.coro.param", "llvm.coro.promise", + "llvm.coro.resume", "llvm.coro.save", "llvm.coro.size", + "llvm.coro.suspend", }; return Intrinsic::lookupLLVMIntrinsicByName(CoroIntrinsics, Name) != -1; } @@ -119,8 +145,8 @@ // Verifies if a module has named values listed. Also, in debug mode verifies // that names are intrinsic names. -bool coro::LowererBase::declaresIntrinsics( - Module &M, std::initializer_list List) { +bool coro::declaresIntrinsics(Module &M, + std::initializer_list List) { for (StringRef Name : List) { assert(isCoroutineIntrinsicName(Name) && "not a coroutine intrinsic"); Index: test/Transforms/Coroutines/coro-elide.ll =================================================================== --- /dev/null +++ test/Transforms/Coroutines/coro-elide.ll @@ -0,0 +1,96 @@ +; Tests that the coro.destroy and coro.resume are devirtualized where possible, +; SCC pipeline restarts and inlines the direct calls. +; RUN: opt < %s -S -coro-early -inline -coro-elide | FileCheck %s + +declare void @print(i32) nounwind + +; resume part of the coroutine +define fastcc void @f.resume(i8*) { + tail call void @print(i32 1) + ret void +} + +; destroy part of the coroutine +define fastcc void @f.destroy(i8*) { + tail call void @print(i32 0) + ret void +} + +@f.resumers = internal constant [2 x void (i8*)*] [void (i8*)* @f.resume, + void (i8*)* @f.destroy] + +; a coroutine start function +define i8* @f() { +entry: + %hdl = call i8* @llvm.coro.begin(i8* null, i32 0, i8* null, + i8* bitcast ([2 x void (i8*)*]* @f.resumers to i8*)) + ret i8* %hdl +} + +; CHECK-LABEL: @callResume +define void @callResume() { +entry: +; CHECK: call i8* @llvm.coro.begin + %hdl = call i8* @f() + +; CHECK-NEXT: call void @print(i32 1) + call void @llvm.coro.resume(i8* %hdl) + +; CHECK-NEXT: call void @print(i32 0) + call void @llvm.coro.destroy(i8* %hdl) + +; CHECK-NEXT: ret void + ret void +} + +; CHECK-LABEL: @eh +define void @eh() personality i8* null { +entry: +; CHECK: call i8* @llvm.coro.begin + %hdl = call i8* @f() + +; CHECK-NEXT: call void @print(i32 1) + invoke void @llvm.coro.resume(i8* %hdl) + to label %cont unwind label %ehcleanup +cont: + ret void + +ehcleanup: + %0 = cleanuppad within none [] + cleanupret from %0 unwind to caller +} + +; CHECK-LABEL: @no_devirt_info_null +; no devirtualization here, since coro.begin info parameter is null +define void @no_devirt_info_null() { +entry: + %hdl = call i8* @llvm.coro.begin(i8* null, i32 0, i8* null, i8* null) + +; CHECK: call i8* @llvm.coro.subfn.addr(i8* %hdl, i8 0) + call void @llvm.coro.resume(i8* %hdl) + +; CHECK: call i8* @llvm.coro.subfn.addr(i8* %hdl, i8 1) + call void @llvm.coro.destroy(i8* %hdl) + +; CHECK: ret void + ret void +} + +; CHECK-LABEL: @no_devirt_no_begin +; no devirtualization here, since coro.begin is not visible +define void @no_devirt_no_begin(i8* %hdl) { +entry: +; CHECK: call i8* @llvm.coro.subfn.addr(i8* %hdl, i8 0) + call void @llvm.coro.resume(i8* %hdl) + +; CHECK: call i8* @llvm.coro.subfn.addr(i8* %hdl, i8 1) + call void @llvm.coro.destroy(i8* %hdl) + +; CHECK: ret void + ret void +} + + +declare void @llvm.coro.resume(i8*) +declare void @llvm.coro.destroy(i8*) +declare i8* @llvm.coro.begin(i8*, i32, i8*, i8*)