Index: include/llvm/Analysis/CallGraph.h =================================================================== --- include/llvm/Analysis/CallGraph.h +++ include/llvm/Analysis/CallGraph.h @@ -47,6 +47,7 @@ #define LLVM_ANALYSIS_CALLGRAPH_H #include "llvm/ADT/GraphTraits.h" +#include "llvm/ADT/MapVector.h" #include "llvm/ADT/STLExtras.h" #include "llvm/IR/CallSite.h" #include "llvm/IR/Function.h" @@ -77,9 +78,22 @@ using FunctionMapTy = std::map>; + /// \brief A type for maintaining dummy nodes. + /// + /// Dummy nodes (i.e., nodes having a null function) include, for example, + /// those created to represent !callees metadata. We use a void pointer as + /// the key to allow for various kinds of dummy nodes. We use a MapVector to + /// ensure a deterministic iteration order (there's no good way to sort dummy + /// nodes). A deterministic iteration order is primarily useful for printing. + using DummyNodeMapTy = + MapVector>; + /// \brief A map from \c Function* to \c CallGraphNode*. FunctionMapTy FunctionMap; + /// \brief A map for maintaining dummy nodes. + DummyNodeMapTy DummyNodeMap; + /// \brief This node has edges to all external functions and those internal /// functions that have their address taken. CallGraphNode *ExternalCallingNode; @@ -99,6 +113,9 @@ /// functions that it calls. void addToCallGraph(Function *F); + /// \brief Return the dummy node associated with the given pointer. + CallGraphNode *getOrInsertDummyNode(const void *P); + public: explicit CallGraph(Module &M); CallGraph(CallGraph &&Arg); Index: include/llvm/IR/CallSite.h =================================================================== --- include/llvm/IR/CallSite.h +++ include/llvm/IR/CallSite.h @@ -653,6 +653,35 @@ return false; } + /// Return the set of functions this call site is known to call. For direct + /// calls, the returned set contains the called function. For indirect calls, + /// this function collects known callees from !callees metadata, if present. + SmallVector getKnownCallees() { + SmallVector Callees; + InstrTy *Inst = getInstruction(); + if (getCalledFunction()) { + // If the call site is direct, just add the called function to the set. + Callees.push_back(getCalledFunction()); + } else if (auto *Node = Inst->getMetadata(LLVMContext::MD_callees)) { + // Otherwise, if the call site is indirect, collect the known callees from + // !callees metadata if present. + for (const MDOperand &Op : Node->operands()) + if (auto *MDConstant = mdconst::extract_or_null(Op)) + Callees.push_back(cast(MDConstant->stripPointerCasts())); + if (!Callees.empty()) { + // Ensure a stable iteration order over the known callees. To do this, + // we sort the functions by name. + std::sort(Callees.begin(), Callees.end(), + [](const Function *RHS, const Function *LHS) { + return RHS->getName() < LHS->getName(); + }); + Callees.erase(std::unique(Callees.begin(), Callees.end()), + Callees.end()); + } + } + return Callees; + } + private: IterTy getCallee() const { if (isCall()) // Skip Callee Index: lib/Analysis/CGSCCPassManager.cpp =================================================================== --- lib/Analysis/CGSCCPassManager.cpp +++ lib/Analysis/CGSCCPassManager.cpp @@ -428,7 +428,7 @@ // irrelevant. for (Instruction &I : instructions(F)) if (auto CS = CallSite(&I)) - if (Function *Callee = CS.getCalledFunction()) + for (Function *Callee : CS.getKnownCallees()) if (Visited.insert(Callee).second && !Callee->isDeclaration()) { Node &CalleeN = *G.lookup(*Callee); Edge *E = N->lookup(CalleeN); Index: lib/Analysis/CallGraph.cpp =================================================================== --- lib/Analysis/CallGraph.cpp +++ lib/Analysis/CallGraph.cpp @@ -38,6 +38,7 @@ CallGraph::CallGraph(CallGraph &&Arg) : M(Arg.M), FunctionMap(std::move(Arg.FunctionMap)), + DummyNodeMap(std::move(Arg.DummyNodeMap)), ExternalCallingNode(Arg.ExternalCallingNode), CallsExternalNode(std::move(Arg.CallsExternalNode)) { Arg.FunctionMap.clear(); @@ -54,6 +55,8 @@ #ifndef NDEBUG for (auto &I : FunctionMap) I.second->allReferencesDropped(); + for (auto &I : DummyNodeMap) + I.second->allReferencesDropped(); #endif } @@ -75,13 +78,28 @@ for (Instruction &I : BB) { if (auto CS = CallSite(&I)) { const Function *Callee = CS.getCalledFunction(); - if (!Callee || !Intrinsic::isLeaf(Callee->getIntrinsicID())) + MDNode *CalleesMDNode = I.getMetadata(LLVMContext::MD_callees); + if (!Callee && CalleesMDNode) { + // If an indirect call site has !callees metadata indicating its + // possible callees, we add an edge from the call site to a dummy + // node. When we construct the dummy node, we add edges from it to + // the functions indicated in the !callees metadata. + bool InitCallees = !DummyNodeMap.count(CalleesMDNode); + CallGraphNode *Dummy = getOrInsertDummyNode(CalleesMDNode); + Node->addCalledFunction(CS, Dummy); + if (InitCallees) + for (Function *PossibleCallee : CS.getKnownCallees()) + if (!PossibleCallee->isIntrinsic()) + Dummy->addCalledFunction(CallSite(), + getOrInsertFunction(PossibleCallee)); + } else if (!Callee || !Intrinsic::isLeaf(Callee->getIntrinsicID())) { // Indirect calls of intrinsics are not allowed so no need to check. // We can be more precise here by using TargetArg returned by // Intrinsic::isLeaf. Node->addCalledFunction(CS, CallsExternalNode.get()); - else if (!Callee->isIntrinsic()) + } else if (!Callee->isIntrinsic()) { Node->addCalledFunction(CS, getOrInsertFunction(Callee)); + } } } } @@ -107,6 +125,11 @@ for (CallGraphNode *CN : Nodes) CN->print(OS); + + // The iteration order of the DummyNodeMap is deterministic, so we don't need + // to sort the nodes. Just print them. + for (auto &Entry : DummyNodeMap) + Entry.second->print(OS); } #if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP) @@ -122,6 +145,12 @@ Function *CallGraph::removeFunctionFromModule(CallGraphNode *CGN) { assert(CGN->empty() && "Cannot remove function from call " "graph if it references other functions!"); + + // If any dummy node references the node for the given function, we first + // need to remove those edges. + for (auto &Entry : DummyNodeMap) + Entry.second->removeAnyCallEdgeTo(CGN); + Function *F = CGN->getFunction(); // Get the function for the call graph node FunctionMap.erase(F); // Remove the call graph node from the map @@ -156,6 +185,14 @@ return CGN.get(); } +CallGraphNode *CallGraph::getOrInsertDummyNode(const void *P) { + auto &CGN = DummyNodeMap[P]; + if (CGN) + return CGN.get(); + CGN = llvm::make_unique(nullptr); + return CGN.get(); +} + //===----------------------------------------------------------------------===// // Implementations of the CallGraphNode class methods. // @@ -173,7 +210,7 @@ if (Function *FI = I.second->getFunction()) OS << "function '" << FI->getName() <<"'\n"; else - OS << "external node\n"; + OS << "<><<" << I.second << ">>\n"; } OS << '\n'; } Index: lib/Analysis/LazyCallGraph.cpp =================================================================== --- lib/Analysis/LazyCallGraph.cpp +++ lib/Analysis/LazyCallGraph.cpp @@ -100,12 +100,14 @@ for (BasicBlock &BB : *F) for (Instruction &I : BB) { if (auto CS = CallSite(&I)) - if (Function *Callee = CS.getCalledFunction()) + for (Function *Callee : CS.getKnownCallees()) if (!Callee->isDeclaration()) if (Callees.insert(Callee).second) { Visited.insert(Callee); + auto EdgeK = CS.getCalledFunction() ? LazyCallGraph::Edge::Call + : LazyCallGraph::Edge::Ref; addEdge(Edges->Edges, Edges->EdgeIndexMap, G->get(*Callee), - LazyCallGraph::Edge::Call); + EdgeK); } for (Value *Op : I.operand_values()) Index: test/Analysis/CallGraph/callees-metadata.ll =================================================================== --- /dev/null +++ test/Analysis/CallGraph/callees-metadata.ll @@ -0,0 +1,33 @@ +; RUN: opt < %s -print-callgraph -disable-output 2>&1 | FileCheck %s + +; CHECK: Call graph node <><<{{.+}}>> #uses=0 +; CHECK-DAG: CS<0x0> calls function 'main' +; CHECK-DAG: CS<0x0> calls function 'add' +; CHECK-DAG: CS<0x0> calls function 'sub' +; +; CHECK: Call graph node for function: 'add'<<{{.+}}>> #uses=2 +; +; CHECK: Call graph node for function: 'main'<<{{.+}}>> #uses=1 +; CHECK-NEXT: CS<{{.+}}> calls <><<[[CALLEES:.+]]>> +; +; CHECK: Call graph node for function: 'sub'<<{{.+}}>> #uses=2 +; +; CHECK: Call graph node <><<[[CALLEES]]>> #uses=1 +; CHECK-DAG: CS<0x0> calls function 'add' +; CHECK-DAG: CS<0x0> calls function 'sub' + +define i64 @main(i64 %x, i64 %y, i64 (i64, i64)* %binop) { + %tmp0 = call i64 %binop(i64 %x, i64 %y), + !callees !{i64 (i64, i64)* @add, i64 (i64, i64)* @sub} + ret i64 %tmp0 +} + +define i64 @add(i64 %x, i64 %y) { + %tmp0 = add i64 %x, %y + ret i64 %tmp0 +} + +define i64 @sub(i64 %x, i64 %y) { + %tmp0 = sub i64 %x, %y + ret i64 %tmp0 +} Index: test/Analysis/CallGraph/non-leaf-intrinsics.ll =================================================================== --- test/Analysis/CallGraph/non-leaf-intrinsics.ll +++ test/Analysis/CallGraph/non-leaf-intrinsics.ll @@ -26,7 +26,7 @@ ; CHECK: CS<0x0> calls function 'f' ; CHECK: Call graph node for function: 'calls_patchpoint' -; CHECK-NEXT: CS<[[addr_1:[^>]+]]> calls external node +; CHECK-NEXT: CS<[[addr_1:[^>]+]]> calls <> ; CHECK: Call graph node for function: 'calls_statepoint' -; CHECK-NEXT: CS<[[addr_0:[^>]+]]> calls external node +; CHECK-NEXT: CS<[[addr_0:[^>]+]]> calls <> Index: test/Analysis/LazyCallGraph/callees-metadata.ll =================================================================== --- /dev/null +++ test/Analysis/LazyCallGraph/callees-metadata.ll @@ -0,0 +1,37 @@ +; RUN: opt < %s -passes=print-lcg -disable-output 2>&1 | FileCheck %s + +; CHECK: Edges in function: main +; CHECK-DAG: ref -> add +; CHECK-DAG: ref -> sub +; +; CHECK: Edges in function: add +; +; CHECK: Edges in function: sub +; +; CHECK: RefSCC with 1 call SCCs: +; CHECK-NEXT: SCC with 1 functions: +; CHECK-NEXT: sub +; +; CHECK: RefSCC with 1 call SCCs: +; CHECK-NEXT: SCC with 1 functions: +; CHECK-NEXT: add +; +; CHECK: RefSCC with 1 call SCCs: +; CHECK-NEXT: SCC with 1 functions: +; CHECK-NEXT: main + +define i64 @main(i64 %x, i64 %y, i64 (i64, i64)* %binop) { + %tmp0 = call i64 %binop(i64 %x, i64 %y), + !callees !{i64 (i64, i64)* @add, i64 (i64, i64)* @sub} + ret i64 %tmp0 +} + +define i64 @add(i64 %x, i64 %y) { + %tmp0 = add i64 %x, %y + ret i64 %tmp0 +} + +define i64 @sub(i64 %x, i64 %y) { + %tmp0 = sub i64 %x, %y + ret i64 %tmp0 +}