Diff 42234

lib/Transforms/IPO/FunctionImport.cpp

Show All 18 Lines
#include "llvm/IR/IntrinsicInst.h"		#include "llvm/IR/IntrinsicInst.h"
#include "llvm/IR/Module.h"		#include "llvm/IR/Module.h"
#include "llvm/IRReader/IRReader.h"		#include "llvm/IRReader/IRReader.h"
#include "llvm/Linker/Linker.h"		#include "llvm/Linker/Linker.h"
#include "llvm/Object/FunctionIndexObjectFile.h"		#include "llvm/Object/FunctionIndexObjectFile.h"
#include "llvm/Support/CommandLine.h"		#include "llvm/Support/CommandLine.h"
#include "llvm/Support/Debug.h"		#include "llvm/Support/Debug.h"
#include "llvm/Support/SourceMgr.h"		#include "llvm/Support/SourceMgr.h"

		#include <map>

using namespace llvm;		using namespace llvm;

#define DEBUG_TYPE "function-import"		#define DEBUG_TYPE "function-import"

/// Limit on instruction count of imported functions.		/// Limit on instruction count of imported functions.
static cl::opt<unsigned> ImportInstrLimit(		static cl::opt<unsigned> ImportInstrLimit(
"import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),		"import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),
cl::desc("Only import functions with less than N instructions"));		cl::desc("Only import functions with less than N instructions"));
Show All 10 Lines	static std::unique_ptr<Module> loadFile(const std::string &FileName,
}		}

Result->materializeMetadata();		Result->materializeMetadata();
UpgradeDebugInfo(*Result);		UpgradeDebugInfo(*Result);

return Result;		return Result;
}		}

		namespace {
		/// Helper to load on demand a Module from file and cache it for subsequent
		/// queries. It can be used with the FunctionImporter.
		class ModuleLazyLoaderCache {
		tejohnsonUnsubmitted Done Reply Inline Actions Remove tejohnson: Remove
		/// Cache of lazily loaded module for import.
		StringMap<std::unique_ptr<Module>> ModuleMap;

		/// Callback invoked to lazily create the Module for a file name that is not yet in the cache.
		std::function<std::unique_ptr<Module>(StringRef FileName)> createLazyModule;

		public:
		/// Create the loader; Modules are created on demand by calling \p createLazyModule.
		ModuleLazyLoaderCache(std::function<
		std::unique_ptr<Module>(StringRef FileName)> createLazyModule)
		: createLazyModule(createLazyModule) {}

		/// Retrieve a Module from the cache or lazily load it on demand.
		Module &operator()(StringRef FileName);
		};

		// Get a Module for \p Identifier from the cache, or load it lazily.
		Module &ModuleLazyLoaderCache::operator()(StringRef Identifier) {
		auto &Module = ModuleMap[Identifier];
		if (!Module)
		Module = createLazyModule(Identifier);
		return *Module;
		}
		} // anonymous namespace

/// Walk through the instructions in \p F looking for external		/// Walk through the instructions in \p F looking for external
/// calls not already in the \p CalledFunctions set. If any are		/// calls not already in the \p CalledFunctions set. If any are
/// found they are added to the \p Worklist for importing.		/// found they are added to the \p Worklist for importing.
static void findExternalCalls(const Function &F, StringSet<> &CalledFunctions,		static void findExternalCalls(const Module &DestModule, Function &F,
		const FunctionInfoIndex &Index,
		StringSet<> &CalledFunctions,
SmallVector<StringRef, 64> &Worklist) {		SmallVector<StringRef, 64> &Worklist) {
		// We need to suffix internal function calls imported from other modules,
		tejohnsonUnsubmitted Done Reply Inline Actions Maybe "...internal function calls imported from..."? I.e. at this point we have only imported the call. tejohnson: Maybe "...internal function calls imported from..."? I.e. at this point we have only imported…
		// prepare the suffix ahead of time.
		StringRef Suffix;
		if (F.getParent() != &DestModule)
		Suffix =
		(Twine(".llvm.") +
		Twine(Index.getModuleId(F.getParent()->getModuleIdentifier()))).str();

for (auto &BB : F) {		for (auto &BB : F) {
for (auto &I : BB) {		for (auto &I : BB) {
if (isa<CallInst>(I)) {		if (isa<CallInst>(I)) {
auto CalledFunction = cast<CallInst>(I).getCalledFunction();		auto CalledFunction = cast<CallInst>(I).getCalledFunction();
// Insert any new external calls that have not already been		// Insert any new external calls that have not already been
// added to set/worklist.		// added to set/worklist.
if (CalledFunction && CalledFunction->hasName() &&		if (!CalledFunction || !CalledFunction->hasName())
CalledFunction->isDeclaration() &&		continue;
!CalledFunctions.count(CalledFunction->getName())) {		// Ignore intrinsics early
CalledFunctions.insert(CalledFunction->getName());		if (CalledFunction->isIntrinsic()) {
Worklist.push_back(CalledFunction->getName());		assert(CalledFunction->getIntrinsicID() != 0);
		continue;
		}
		auto ImportedName = CalledFunction->getName();
		auto Renamed = (ImportedName + Suffix).str();
		// Rename internal functions
		if (CalledFunction->hasInternalLinkage()) {
		ImportedName = Renamed;
		}
		auto It = CalledFunctions.insert(ImportedName);
		if (!It.second) {
		// This is a call to a function we already considered, skip.
		tejohnsonUnsubmitted Not Done Reply Inline Actions We will never reconsider a function after initially deciding it isn't profitable to import. Currently the only profitability decision is based on the number of instructions, which won't change with importing. But perhaps we should add a TODO down where we have those checks to remove any callees from the CalledFunctions list if they fail a profitability check that may be affected by additional importing decisions. tejohnson: We will never reconsider a function after initially deciding it isn't profitable to import.
		continue;
}		}
		#ifndef NDEBUG
		// Ignore functions already present in the destination module
		auto *SrcGV = DestModule.getNamedValue(ImportedName);
		tejohnsonUnsubmitted Done Reply Inline Actions We reach here if the function is already in the CalledFunctions set, so do we want to issue a message that we are ignoring it? It seems misleading, i.e. it sounds like we decided not to import. tejohnson: We reach here if the function is already in the CalledFunctions set, so do we want to issue a…
		if (SrcGV) {
		assert(isa<Function>(SrcGV) && "Name collision during import");
		if (!cast<Function>(SrcGV)->isDeclaration()) {
		DEBUG(dbgs() << DestModule.getModuleIdentifier() << "Ignoring "
		<< ImportedName << " already in DestinationModule\n");
		continue;
		}
		}
		#endif // NDEBUG

		Worklist.push_back(It.first->getKey());
		DEBUG(dbgs() << DestModule.getModuleIdentifier()
		tejohnsonUnsubmitted Done Reply Inline Actions Why is this under #ifndef NDEBUG? tejohnson: Why is this under #ifndef NDEBUG?
		<< " Adding callee for : " << ImportedName << " : "
		<< F.getName() << "\n");
}		}
}		}
}		}
}		}

// Helper function: given a worklist and an index, will process all the worklist		// Helper function: given a worklist and an index, will process all the worklist
// and import them based on the summary information		// and decide what to import based on the summary information.
static unsigned ProcessImportWorklist(		//
		// Nothing is actually imported, functions are materialized in their source
		// module and analyzed there.
		//
		// \p ModuleToFunctionsToImportMap is filled with the set of Functions to
		// import per Module.
		static void GetImportList(
Module &DestModule, SmallVector<StringRef, 64> &Worklist,		Module &DestModule, SmallVector<StringRef, 64> &Worklist,
StringSet<> &CalledFunctions, Linker &TheLinker,		StringSet<> &CalledFunctions,
const FunctionInfoIndex &Index,		std::map<StringRef, std::pair<Module *, DenseSet<const GlobalValue *>>> &
std::function<std::unique_ptr<Module>(StringRef FileName)> &		ModuleToFunctionsToImportMap,
LazyModuleLoader) {		const FunctionInfoIndex &Index, ModuleLazyLoaderCache &ModuleLoaderCache) {
unsigned ImportCount = 0;
while (!Worklist.empty()) {		while (!Worklist.empty()) {
auto CalledFunctionName = Worklist.pop_back_val();		auto CalledFunctionName = Worklist.pop_back_val();
DEBUG(dbgs() << "Process import for " << CalledFunctionName << "\n");		DEBUG(dbgs() << "Process import for " << CalledFunctionName << "\n");

// Try to get a summary for this function call.		// Try to get a summary for this function call.
auto InfoList = Index.findFunctionInfoList(CalledFunctionName);		auto InfoList = Index.findFunctionInfoList(CalledFunctionName);
if (InfoList == Index.end()) {		if (InfoList == Index.end()) {
DEBUG(dbgs() << "No summary for " << CalledFunctionName		DEBUG(dbgs() << "No summary for " << CalledFunctionName
Show All 17 Lines	while (!Worklist.empty()) {
if (Summary->instCount() > ImportInstrLimit) {		if (Summary->instCount() > ImportInstrLimit) {
DEBUG(dbgs() << "Skip import of " << CalledFunctionName << " with "		DEBUG(dbgs() << "Skip import of " << CalledFunctionName << " with "
<< Summary->instCount() << " instructions (limit "		<< Summary->instCount() << " instructions (limit "
<< ImportInstrLimit << ")\n");		<< ImportInstrLimit << ")\n");
continue;		continue;
}		}

// Get the module path from the summary.		// Get the module path from the summary.
auto FileName = Summary->modulePath();		auto ModuleIdentifier = Summary->modulePath();
DEBUG(dbgs() << "Importing " << CalledFunctionName << " from " << FileName		DEBUG(dbgs() << DestModule.getModuleIdentifier() << " Importing "
<< "\n");		<< CalledFunctionName << " from " << ModuleIdentifier << "\n");

// Get the module for the import		auto &SrcModule = ModuleLoaderCache(ModuleIdentifier);
auto SrcModule = LazyModuleLoader(FileName);
assert(&SrcModule->getContext() == &DestModule.getContext());

// The function that we will import!		// The function that we will import!
GlobalValue *SGV = SrcModule->getNamedValue(CalledFunctionName);		GlobalValue *SGV = SrcModule.getNamedValue(CalledFunctionName);
StringRef ImportFunctionName = CalledFunctionName;
if (!SGV) {		if (!SGV) {
// Might be local in source Module, promoted/renamed in DestModule.		// The destination module references functions by their renamed name
		// when importing a function that was originally local in the source
		// module. The source module we have might not have been renamed, so we
		// try to remove the suffix added during the renaming to recover the
		// original name in the source module.
std::pair<StringRef, StringRef> Split =		std::pair<StringRef, StringRef> Split =
CalledFunctionName.split(".llvm.");		CalledFunctionName.split(".llvm.");
SGV = SrcModule->getNamedValue(Split.first);		SGV = SrcModule.getNamedValue(Split.first);
#ifndef NDEBUG		assert(SGV && "Can't find function to import in source module");
// Assert that Split.second is module id
uint64_t ModuleId;
assert(!Split.second.getAsInteger(10, ModuleId));
assert(ModuleId == Index.getModuleId(FileName));
#endif
}		}
		if (!SGV) {
		report_fatal_error(Twine("Can't load function '") + CalledFunctionName +
		"' in Module '" + SrcModule.getModuleIdentifier() +
		"', error in the summary?\n");
		}

Function *F = dyn_cast<Function>(SGV);		Function *F = dyn_cast<Function>(SGV);
if (!F && isa<GlobalAlias>(SGV)) {		if (!F && isa<GlobalAlias>(SGV)) {
auto *SGA = dyn_cast<GlobalAlias>(SGV);		auto *SGA = dyn_cast<GlobalAlias>(SGV);
F = dyn_cast<Function>(SGA->getBaseObject());		F = dyn_cast<Function>(SGA->getBaseObject());
ImportFunctionName = F->getName();		CalledFunctionName = F->getName();
}
if (!F) {
errs() << "Can't load function '" << CalledFunctionName << "' in Module '"
<< FileName << "', error in the summary?\n";
llvm_unreachable("Can't load function in Module");
}		}
		assert(F && "Imported Function is ... not a Function");

// We cannot import weak_any functions/aliases without possibly affecting		// We cannot import weak_any functions/aliases without possibly affecting
// the order they are seen and selected by the linker, changing program		// the order they are seen and selected by the linker, changing program
// semantics.		// semantics.
if (SGV->hasWeakAnyLinkage()) {		if (SGV->hasWeakAnyLinkage()) {
DEBUG(dbgs() << "Ignoring import request for weak-any "		DEBUG(dbgs() << "Ignoring import request for weak-any "
<< (isa<Function>(SGV) ? "function " : "alias ")		<< (isa<Function>(SGV) ? "function " : "alias ")
<< CalledFunctionName << " from " << FileName << "\n");		<< CalledFunctionName << " from "
		<< SrcModule.getModuleIdentifier() << "\n");
continue;		continue;
}		}

// Link in the specified function.		// Add the function to the import list
DenseSet<const GlobalValue *> FunctionsToImport;		auto &Entry = ModuleToFunctionsToImportMap[SrcModule.getModuleIdentifier()];
FunctionsToImport.insert(F);		Entry.first = &SrcModule;
if (TheLinker.linkInModule(*SrcModule, Linker::Flags::None, &Index,		Entry.second.insert(F);
&FunctionsToImport))
		tejohnsonUnsubmitted Done Reply Inline Actions How do you ensure that F is materialized in the lazy-loaded SrcModule? With the current code at HEAD it is the dest copy we walk, which was materialized in the source and then copied over during module linking. Another issue with using the source copy here - the local functions haven't been renamed/promoted, so there may be apparent duplicates in CalledFunctions due to same-named local functions from other modules. tejohnson: How do you ensure that F is materialized in the lazy-loaded SrcModule? With the current code at…
report_fatal_error("Function Import: link error");		// Process the newly imported functions and add callees to the worklist.
		F->materialize();
// Process the newly imported function and add callees to the worklist.		findExternalCalls(DestModule, *F, Index, CalledFunctions, Worklist);
GlobalValue *NewGV = DestModule.getNamedValue(ImportFunctionName);
assert(NewGV);
Function *NewF = dyn_cast<Function>(NewGV);
assert(NewF);
findExternalCalls(*NewF, CalledFunctions, Worklist);
++ImportCount;
}		}
return ImportCount;
}		}

// Automatically import functions in Module \p DestModule based on the summaries		// Automatically import functions in Module \p DestModule based on the summaries
// index.		// index.
//		//
// The current implementation imports every called function that exists in the		// The current implementation imports every called function that exists in the
// summaries index.		// summaries index.
bool FunctionImporter::importFunctions(Module &DestModule) {		bool FunctionImporter::importFunctions(Module &DestModule) {
DEBUG(errs() << "Starting import for Module "		DEBUG(errs() << "Starting import for Module "
<< DestModule.getModuleIdentifier() << "\n");		<< DestModule.getModuleIdentifier() << "\n");
unsigned ImportedCount = 0;		unsigned ImportedCount = 0;

/// First step is collecting the called external functions.		/// First step is collecting the called external functions.
StringSet<> CalledFunctions;		StringSet<> CalledFunctions;
SmallVector<StringRef, 64> Worklist;		SmallVector<StringRef, 64> Worklist;
for (auto &F : DestModule) {		for (auto &F : DestModule) {
if (F.isDeclaration() || F.hasFnAttribute(Attribute::OptimizeNone))		if (F.isDeclaration() || F.hasFnAttribute(Attribute::OptimizeNone))
continue;		continue;
findExternalCalls(F, CalledFunctions, Worklist);		findExternalCalls(DestModule, F, Index, CalledFunctions, Worklist);
}		}
if (Worklist.empty())		if (Worklist.empty())
return false;		return false;

/// Second step: for every call to an external function, try to import it.		/// Second step: for every call to an external function, try to import it.

// Linker that will be used for importing function		// Linker that will be used for importing function
Linker TheLinker(DestModule, DiagnosticHandler);		Linker TheLinker(DestModule, DiagnosticHandler);

ImportedCount += ProcessImportWorklist(DestModule, Worklist, CalledFunctions,		// Map of Module -> List of Function to import from the Module
TheLinker, Index, ModuleLoader);		std::map<StringRef, std::pair<Module *, DenseSet<const GlobalValue *>>>
		ModuleToFunctionsToImportMap;

		// Analyze the summaries and get the list of functions to import by
		tejohnsonUnsubmitted Done Reply Inline Actions Comment reads funny: "helps required by" tejohnson: Comment reads funny: "helps required by"
		// populating ModuleToFunctionsToImportMap
		ModuleLazyLoaderCache ModuleLoaderCache(ModuleLoader);
		GetImportList(DestModule, Worklist, CalledFunctions,
		ModuleToFunctionsToImportMap, Index, ModuleLoaderCache);
		assert(Worklist.empty() && "Worklist hasn't been flushed in GetImportList");
		tejohnsonUnsubmitted Done Reply Inline Actions I don't see anything called ProcessImportWorklist? Do you mean GetImportList? Each iteration of what? tejohnson: I don't see anything called ProcessImportWorklist? Do you mean GetImportList? Each iteration of…

		// Do the actual import of functions now, one Module at a time
		for (auto &FunctionsToImportPerModule : ModuleToFunctionsToImportMap) {
		// Get the module for the import
		auto &FunctionsToImport = FunctionsToImportPerModule.second.second;
		auto *SrcModule = FunctionsToImportPerModule.second.first;
		assert(&DestModule.getContext() == &SrcModule->getContext() &&
		"Context mismatch");

		// Link in the specified functions.
		if (TheLinker.linkInModule(*SrcModule, Linker::Flags::None, &Index,
		&FunctionsToImport))
		report_fatal_error("Function Import: link error");

DEBUG(errs() << "Imported " << ImportedCount << " functions for Module "		ImportedCount += FunctionsToImport.size();
		}
		DEBUG(dbgs() << "Imported " << ImportedCount << " functions for Module "
<< DestModule.getModuleIdentifier() << "\n");		<< DestModule.getModuleIdentifier() << "\n");
return ImportedCount;		return ImportedCount;
}		}

/// Summary file to use for function importing when using -function-import from		/// Summary file to use for function importing when using -function-import from
/// the command line.		/// the command line.
static cl::opt<std::string>		static cl::opt<std::string>
SummaryFile("summary-file",		SummaryFile("summary-file",
▲ Show 20 Lines • Show All 90 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

FunctionImporter: implement bulk function importing for efficiency
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 42234

lib/Transforms/IPO/FunctionImport.cpp

This is an archive of the discontinued LLVM Phabricator instance.

FunctionImporter: implement bulk function importing for efficiency
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 42234

lib/Transforms/IPO/FunctionImport.cpp

FunctionImporter: implement bulk function importing for efficiency
ClosedPublic