This is an archive of the discontinued LLVM Phabricator instance.

Implement selective bitcode linking and internalization of linked symbols
ClosedPublic

Authored by tra on Aug 28 2015, 4:45 PM.

Download Raw Diff

Details

Reviewers

tra
pcc
echristo
dexonsmith

Commits

rG020d4fb17f92: New bitcode linker flags:
rL246561: New bitcode linker flags:

Summary

In order to support CUDA, we need a way to link in a subset of functions from a bitcode library.

The current way to do that, suggested in the NVPTX guide (http://llvm.org/docs/NVPTXUsage.html), requires linking in the complete library, internalizing all symbols except those that were originally present in the TU before linking, and then running the GDCE (GlobalDCE) pass to eliminate the bitcode we don't need.

Considering that we only need a fairly small subset of functions from the library, a better way to do that would be to directly link in only the symbols needed by the destination module and internalize them in the process, if required.

This patch adds two new linker flags to do exactly that.

-only-needed -- links in only the symbols needed by the destination module.
-internalize -- internalizes the linked symbols.

Diff Detail

Repository: rL LLVM

Event Timeline

tra updated this revision to Diff 33254. · Aug 28 2015, 4:45 PM

tra retitled this revision from to Implement selective bitcode linking and internalization of linked symbols.

tra updated this object.

tra added reviewers: echristo, dexonsmith, pcc.

tra added a subscriber: llvm-commits.

Herald added a subscriber: jholewinski. · View Herald Transcript · Aug 28 2015, 4:45 PM

tra added inline comments. · Aug 28 2015, 4:47 PM

lib/Target/NVPTX/NVPTXTargetMachine.cpp
184–186 ↗	(On Diff #33254)	This change was included by mistake. I'll update the patch shortly to remove it.

Removed changes included by mistake.

Fixed a nit spotted by dexonsmith@.

LGTM by dexonsmith@ on llvm-commits list.

This revision is now accepted and ready to land. · Sep 1 2015, 10:56 AM

Closed by commit rL246561: New bitcode linker flags: (authored by tra). · Explain Why · Sep 1 2015, 10:57 AM

This revision was automatically updated to reflect the committed changes.

Revision Contents

Path

Size

llvm/

trunk/

include/

llvm/

Linker/

Linker.h

15 lines

lib/

Linker/

LinkModules.cpp

46 lines

test/

Linker/

Inputs/

linkage.c.ll

4 lines

link-flags.ll

21 lines

tools/

llvm-link/

llvm-link.cpp

25 lines

Diff 33711

llvm/trunk/include/llvm/Linker/Linker.h

Show First 20 Lines • Show All 54 Lines • ▼ Show 20 Lines	struct IdentifiedStructTypeSet {

void addNonOpaque(StructType *Ty);		void addNonOpaque(StructType *Ty);
void switchToNonOpaque(StructType *Ty);		void switchToNonOpaque(StructType *Ty);
void addOpaque(StructType *Ty);		void addOpaque(StructType *Ty);
StructType findNonOpaque(ArrayRef<Type > ETypes, bool IsPacked);		StructType findNonOpaque(ArrayRef<Type > ETypes, bool IsPacked);
bool hasType(StructType *Ty);		bool hasType(StructType *Ty);
};		};

		enum Flags {
		None = 0,
		OverrideFromSrc = (1 << 0),
		LinkOnlyNeeded = (1 << 1),
		InternalizeLinkedSymbols = (1 << 2)
		};

Linker(Module *M, DiagnosticHandlerFunction DiagnosticHandler);		Linker(Module *M, DiagnosticHandlerFunction DiagnosticHandler);
Linker(Module *M);		Linker(Module *M);

Module *getModule() const { return Composite; }		Module *getModule() const { return Composite; }
void deleteModule();		void deleteModule();

/// \brief Link \p Src into the composite. The source is destroyed.		/// \brief Link \p Src into the composite. The source is destroyed.
/// Passing OverrideSymbols as true will have symbols from Src		/// Passing OverrideSymbols as true will have symbols from Src
/// shadow those in the Dest.		/// shadow those in the Dest.
/// Returns true on error.		/// Returns true on error.
bool linkInModule(Module *Src, bool OverrideSymbols = false);		bool linkInModule(Module *Src, unsigned Flags = Flags::None);

/// \brief Set the composite to the passed-in module.		/// \brief Set the composite to the passed-in module.
void setModule(Module *Dst);		void setModule(Module *Dst);

static bool LinkModules(Module Dest, Module Src,		static bool LinkModules(Module Dest, Module Src,
DiagnosticHandlerFunction DiagnosticHandler);		DiagnosticHandlerFunction DiagnosticHandler,
		unsigned Flags = Flags::None);

static bool LinkModules(Module Dest, Module Src);		static bool LinkModules(Module Dest, Module Src,
		unsigned Flags = Flags::None);

private:		private:
void init(Module *M, DiagnosticHandlerFunction DiagnosticHandler);		void init(Module *M, DiagnosticHandlerFunction DiagnosticHandler);
Module *Composite;		Module *Composite;

IdentifiedStructTypeSet IdentifiedStructTypes;		IdentifiedStructTypeSet IdentifiedStructTypes;

DiagnosticHandlerFunction DiagnosticHandler;		DiagnosticHandlerFunction DiagnosticHandler;
};		};

} // End llvm namespace		} // End llvm namespace

#endif		#endif

llvm/trunk/lib/Linker/LinkModules.cpp

Show First 20 Lines • Show All 419 Lines • ▼ Show 20 Lines	class ModuleLinker {
std::vector<GlobalValue *> LazilyLinkGlobalValues;		std::vector<GlobalValue *> LazilyLinkGlobalValues;

/// Functions that have replaced other functions.		/// Functions that have replaced other functions.
SmallPtrSet<const Function *, 16> OverridingFunctions;		SmallPtrSet<const Function *, 16> OverridingFunctions;

DiagnosticHandlerFunction DiagnosticHandler;		DiagnosticHandlerFunction DiagnosticHandler;

/// For symbol clashes, prefer those from Src.		/// For symbol clashes, prefer those from Src.
bool OverrideFromSrc;		unsigned Flags;

public:		public:
ModuleLinker(Module dstM, Linker::IdentifiedStructTypeSet &Set, Module srcM,		ModuleLinker(Module dstM, Linker::IdentifiedStructTypeSet &Set, Module srcM,
DiagnosticHandlerFunction DiagnosticHandler,		DiagnosticHandlerFunction DiagnosticHandler, unsigned Flags)
bool OverrideFromSrc)
: DstM(dstM), SrcM(srcM), TypeMap(Set),		: DstM(dstM), SrcM(srcM), TypeMap(Set),
ValMaterializer(TypeMap, DstM, LazilyLinkGlobalValues),		ValMaterializer(TypeMap, DstM, LazilyLinkGlobalValues),
DiagnosticHandler(DiagnosticHandler), OverrideFromSrc(OverrideFromSrc) {		DiagnosticHandler(DiagnosticHandler), Flags(Flags) {}
}

bool run();		bool run();

		bool shouldOverrideFromSrc() { return Flags & Linker::OverrideFromSrc; }
		bool shouldLinkOnlyNeeded() { return Flags & Linker::LinkOnlyNeeded; }
		bool shouldInternalizeLinkedSymbols() {
		return Flags & Linker::InternalizeLinkedSymbols;
		}

private:		private:
bool shouldLinkFromSource(bool &LinkFromSrc, const GlobalValue &Dest,		bool shouldLinkFromSource(bool &LinkFromSrc, const GlobalValue &Dest,
const GlobalValue &Src);		const GlobalValue &Src);

/// Helper method for setting a message and returning an error code.		/// Helper method for setting a message and returning an error code.
bool emitError(const Twine &Message) {		bool emitError(const Twine &Message) {
DiagnosticHandler(LinkDiagnosticInfo(DS_Error, Message));		DiagnosticHandler(LinkDiagnosticInfo(DS_Error, Message));
return true;		return true;
▲ Show 20 Lines • Show All 276 Lines • ▼ Show 20 Lines	bool ModuleLinker::getComdatResult(const Comdat *SrcC,
return computeResultingSelectionKind(ComdatName, SSK, DSK, Result,		return computeResultingSelectionKind(ComdatName, SSK, DSK, Result,
LinkFromSrc);		LinkFromSrc);
}		}

bool ModuleLinker::shouldLinkFromSource(bool &LinkFromSrc,		bool ModuleLinker::shouldLinkFromSource(bool &LinkFromSrc,
const GlobalValue &Dest,		const GlobalValue &Dest,
const GlobalValue &Src) {		const GlobalValue &Src) {
// Should we unconditionally use the Src?		// Should we unconditionally use the Src?
if (OverrideFromSrc) {		if (shouldOverrideFromSrc()) {
LinkFromSrc = true;		LinkFromSrc = true;
return false;		return false;
}		}

// We always have to add Src if it has appending linkage.		// We always have to add Src if it has appending linkage.
if (Src.hasAppendingLinkage()) {		if (Src.hasAppendingLinkage()) {
LinkFromSrc = true;		LinkFromSrc = true;
return false;		return false;
▲ Show 20 Lines • Show All 334 Lines • ▼ Show 20 Lines	if (!LinkFromSrc && !DGV)
return false;		return false;

GlobalValue *NewGV;		GlobalValue *NewGV;
if (!LinkFromSrc) {		if (!LinkFromSrc) {
NewGV = DGV;		NewGV = DGV;
} else {		} else {
// If the GV is to be lazily linked, don't create it just yet.		// If the GV is to be lazily linked, don't create it just yet.
// The ValueMaterializerTy will deal with creating it if it's used.		// The ValueMaterializerTy will deal with creating it if it's used.
if (!DGV && !OverrideFromSrc &&		if (!DGV && !shouldOverrideFromSrc() &&
(SGV->hasLocalLinkage() \|\| SGV->hasLinkOnceLinkage() \|\|		(SGV->hasLocalLinkage() \|\| SGV->hasLinkOnceLinkage() \|\|
SGV->hasAvailableExternallyLinkage())) {		SGV->hasAvailableExternallyLinkage())) {
DoNotLinkFromSource.insert(SGV);		DoNotLinkFromSource.insert(SGV);
return false;		return false;
}		}

		// When we only want to link in unresolved dependencies, blacklist
		// the symbol unless DstM has a matching declaration (DGV).
		if (shouldLinkOnlyNeeded() && !(DGV && DGV->isDeclaration())) {
		DoNotLinkFromSource.insert(SGV);
		return false;
		}

NewGV = copyGlobalValueProto(TypeMap, *DstM, SGV);		NewGV = copyGlobalValueProto(TypeMap, *DstM, SGV);

if (DGV && isa<Function>(DGV))		if (DGV && isa<Function>(DGV))
if (auto *NewF = dyn_cast<Function>(NewGV))		if (auto *NewF = dyn_cast<Function>(NewGV))
OverridingFunctions.insert(NewF);		OverridingFunctions.insert(NewF);
}		}

NewGV->setUnnamedAddr(HasUnnamedAddr);		NewGV->setUnnamedAddr(HasUnnamedAddr);
▲ Show 20 Lines • Show All 145 Lines • ▼ Show 20 Lines	void ModuleLinker::linkAliasBody(GlobalAlias &Dst, GlobalAlias &Src) {
Constant *Val = MapValue(Aliasee, ValueMap, RF_MoveDistinctMDs, &TypeMap,		Constant *Val = MapValue(Aliasee, ValueMap, RF_MoveDistinctMDs, &TypeMap,
&ValMaterializer);		&ValMaterializer);
Dst.setAliasee(Val);		Dst.setAliasee(Val);
}		}

bool ModuleLinker::linkGlobalValueBody(GlobalValue &Src) {		bool ModuleLinker::linkGlobalValueBody(GlobalValue &Src) {
Value *Dst = ValueMap[&Src];		Value *Dst = ValueMap[&Src];
assert(Dst);		assert(Dst);
		if (shouldInternalizeLinkedSymbols())
		if (auto *DGV = dyn_cast<GlobalValue>(Dst))
		DGV->setLinkage(GlobalValue::InternalLinkage);
if (auto *F = dyn_cast<Function>(&Src))		if (auto *F = dyn_cast<Function>(&Src))
return linkFunctionBody(cast<Function>(Dst), F);		return linkFunctionBody(cast<Function>(Dst), F);
if (auto *GVar = dyn_cast<GlobalVariable>(&Src)) {		if (auto *GVar = dyn_cast<GlobalVariable>(&Src)) {
linkGlobalInit(cast<GlobalVariable>(Dst), GVar);		linkGlobalInit(cast<GlobalVariable>(Dst), GVar);
return false;		return false;
}		}
linkAliasBody(cast<GlobalAlias>(*Dst), cast<GlobalAlias>(Src));		linkAliasBody(cast<GlobalAlias>(*Dst), cast<GlobalAlias>(Src));
return false;		return false;
▲ Show 20 Lines • Show All 367 Lines • ▼ Show 20 Lines	for (GlobalVariable &Src : SrcM->globals()) {
linkGlobalValueBody(Src);		linkGlobalValueBody(Src);
}		}

// Process vector of lazily linked in functions.		// Process vector of lazily linked in functions.
while (!LazilyLinkGlobalValues.empty()) {		while (!LazilyLinkGlobalValues.empty()) {
GlobalValue *SGV = LazilyLinkGlobalValues.back();		GlobalValue *SGV = LazilyLinkGlobalValues.back();
LazilyLinkGlobalValues.pop_back();		LazilyLinkGlobalValues.pop_back();

		// Skip declarations that ValueMaterializer may have created in
		// case we link in only some of SrcM.
		if (shouldLinkOnlyNeeded() && SGV->isDeclaration())
		continue;

assert(!SGV->isDeclaration() && "users should not pass down decls");		assert(!SGV->isDeclaration() && "users should not pass down decls");
if (linkGlobalValueBody(*SGV))		if (linkGlobalValueBody(*SGV))
return true;		return true;
}		}

return false;		return false;
}		}

▲ Show 20 Lines • Show All 111 Lines • ▼ Show 20 Lines	Linker::Linker(Module *M) {
});		});
}		}

void Linker::deleteModule() {		void Linker::deleteModule() {
delete Composite;		delete Composite;
Composite = nullptr;		Composite = nullptr;
}		}

bool Linker::linkInModule(Module *Src, bool OverrideSymbols) {		bool Linker::linkInModule(Module *Src, unsigned Flags) {
ModuleLinker TheLinker(Composite, IdentifiedStructTypes, Src,		ModuleLinker TheLinker(Composite, IdentifiedStructTypes, Src,
DiagnosticHandler, OverrideSymbols);		DiagnosticHandler, Flags);
bool RetCode = TheLinker.run();		bool RetCode = TheLinker.run();
Composite->dropTriviallyDeadConstantArrays();		Composite->dropTriviallyDeadConstantArrays();
return RetCode;		return RetCode;
}		}

void Linker::setModule(Module *Dst) {		void Linker::setModule(Module *Dst) {
init(Dst, DiagnosticHandler);		init(Dst, DiagnosticHandler);
}		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// LinkModules entrypoint.		// LinkModules entrypoint.
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

/// This function links two modules together, with the resulting Dest module		/// This function links two modules together, with the resulting Dest module
/// modified to be the composite of the two input modules. If an error occurs,		/// modified to be the composite of the two input modules. If an error occurs,
/// true is returned and ErrorMsg (if not null) is set to indicate the problem.		/// true is returned and ErrorMsg (if not null) is set to indicate the problem.
/// Upon failure, the Dest module could be in a modified state, and shouldn't be		/// Upon failure, the Dest module could be in a modified state, and shouldn't be
/// relied on to be consistent.		/// relied on to be consistent.
bool Linker::LinkModules(Module Dest, Module Src,		bool Linker::LinkModules(Module Dest, Module Src,
DiagnosticHandlerFunction DiagnosticHandler) {		DiagnosticHandlerFunction DiagnosticHandler,
		unsigned Flags) {
Linker L(Dest, DiagnosticHandler);		Linker L(Dest, DiagnosticHandler);
return L.linkInModule(Src);		return L.linkInModule(Src, Flags);
}		}

bool Linker::LinkModules(Module Dest, Module Src) {		bool Linker::LinkModules(Module Dest, Module Src, unsigned Flags) {
Linker L(Dest);		Linker L(Dest);
return L.linkInModule(Src);		return L.linkInModule(Src, Flags);
}		}

//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//
// C API.		// C API.
//===----------------------------------------------------------------------===//		//===----------------------------------------------------------------------===//

LLVMBool LLVMLinkModules(LLVMModuleRef Dest, LLVMModuleRef Src,		LLVMBool LLVMLinkModules(LLVMModuleRef Dest, LLVMModuleRef Src,
LLVMLinkerMode Unused, char **OutMessages) {		LLVMLinkerMode Unused, char **OutMessages) {
Show All 14 Lines

llvm/trunk/test/Linker/Inputs/linkage.c.ll

				@X = global i32 5
				@U = global i32 6
				define i32 @foo() { ret i32 7 }
				define i32 @unused() { ret i32 8 }

llvm/trunk/test/Linker/link-flags.ll

				; RUN: llvm-as %S/Inputs/linkage.b.ll -o %t.b.bc
				; RUN: llvm-as %S/Inputs/linkage.c.ll -o %t.c.bc
				; RUN: llvm-link -S %t.b.bc %t.c.bc \| FileCheck %s -check-prefix=B -check-prefix=C -check-prefix=CU
				; RUN: llvm-link -S -only-needed %t.b.bc %t.c.bc \| FileCheck %s -check-prefix=B -check-prefix=C -check-prefix=CN
				; RUN: llvm-link -S -internalize %t.b.bc %t.c.bc \| FileCheck %s -check-prefix=B -check-prefix=CI
				; RUN: llvm-link -S -internalize -only-needed %t.b.bc %t.c.bc \| FileCheck %s -check-prefix=B -check-prefix=CN

				C-LABEL: @X = global i32 5
				CI-LABEL: @X = internal global i32 5
				CU-LABEL:@U = global i32 6
				CI-LABEL:@U = internal global i32 6
				CN-LABEL-NOT:@U

				B-LABEL: define void @bar() {

				C-LABEL: define i32 @foo()
				CI-LABEL: define internal i32 @foo()

				CU-LABEL:define i32 @unused() {
				CI-LABEL:define internal i32 @unused() {
				CN-LABEL-NOT:@unused()

llvm/trunk/tools/llvm-link/llvm-link.cpp

Show First 20 Lines • Show All 42 Lines • ▼ Show 20 Lines	static cl::list<std::string> OverridingInputs(
cl::desc(		cl::desc(
"input bitcode file which can override previously defined symbol(s)"));		"input bitcode file which can override previously defined symbol(s)"));

static cl::opt<std::string>		static cl::opt<std::string>
OutputFilename("o", cl::desc("Override output filename"), cl::init("-"),		OutputFilename("o", cl::desc("Override output filename"), cl::init("-"),
cl::value_desc("filename"));		cl::value_desc("filename"));

static cl::opt<bool>		static cl::opt<bool>
		Internalize("internalize", cl::desc("Internalize linked symbols"));

		static cl::opt<bool>
		OnlyNeeded("only-needed", cl::desc("Link only needed symbols"));

		static cl::opt<bool>
Force("f", cl::desc("Enable binary output on terminals"));		Force("f", cl::desc("Enable binary output on terminals"));

static cl::opt<bool>		static cl::opt<bool>
OutputAssembly("S",		OutputAssembly("S",
cl::desc("Write output as LLVM assembly"), cl::Hidden);		cl::desc("Write output as LLVM assembly"), cl::Hidden);

static cl::opt<bool>		static cl::opt<bool>
Verbose("v", cl::desc("Print information about actions taken"));		Verbose("v", cl::desc("Print information about actions taken"));
▲ Show 20 Lines • Show All 50 Lines • ▼ Show 20 Lines	static void diagnosticHandler(const DiagnosticInfo &DI) {

DiagnosticPrinterRawOStream DP(errs());		DiagnosticPrinterRawOStream DP(errs());
DI.print(DP);		DI.print(DP);
errs() << '\n';		errs() << '\n';
}		}

static bool linkFiles(const char *argv0, LLVMContext &Context, Linker &L,		static bool linkFiles(const char *argv0, LLVMContext &Context, Linker &L,
const cl::list<std::string> &Files,		const cl::list<std::string> &Files,
bool OverrideDuplicateSymbols) {		unsigned Flags) {
		// Filter out flags that don't apply to the first file we load.
		unsigned ApplicableFlags = Flags & Linker::Flags::OverrideFromSrc;
for (const auto &File : Files) {		for (const auto &File : Files) {
std::unique_ptr<Module> M = loadFile(argv0, File, Context);		std::unique_ptr<Module> M = loadFile(argv0, File, Context);
if (!M.get()) {		if (!M.get()) {
errs() << argv0 << ": error loading file '" << File << "'\n";		errs() << argv0 << ": error loading file '" << File << "'\n";
return false;		return false;
}		}

if (verifyModule(*M, &errs())) {		if (verifyModule(*M, &errs())) {
errs() << argv0 << ": " << File << ": error: input module is broken!\n";		errs() << argv0 << ": " << File << ": error: input module is broken!\n";
return false;		return false;
}		}

if (Verbose)		if (Verbose)
errs() << "Linking in '" << File << "'\n";		errs() << "Linking in '" << File << "'\n";

if (L.linkInModule(M.get(), OverrideDuplicateSymbols))		if (L.linkInModule(M.get(), ApplicableFlags))
return false;		return false;
		// All linker flags apply to linking of subsequent files.
		ApplicableFlags = Flags;
}		}

return true;		return true;
}		}

int main(int argc, char **argv) {		int main(int argc, char **argv) {
// Print a stack trace if we signal out.		// Print a stack trace if we signal out.
sys::PrintStackTraceOnErrorSignal();		sys::PrintStackTraceOnErrorSignal();
PrettyStackTraceProgram X(argc, argv);		PrettyStackTraceProgram X(argc, argv);

LLVMContext &Context = getGlobalContext();		LLVMContext &Context = getGlobalContext();
llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.		llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
cl::ParseCommandLineOptions(argc, argv, "llvm linker\n");		cl::ParseCommandLineOptions(argc, argv, "llvm linker\n");

auto Composite = make_unique<Module>("llvm-link", Context);		auto Composite = make_unique<Module>("llvm-link", Context);
Linker L(Composite.get(), diagnosticHandler);		Linker L(Composite.get(), diagnosticHandler);

		unsigned Flags = Linker::Flags::None;
		if (Internalize)
		Flags \|= Linker::Flags::InternalizeLinkedSymbols;
		if (OnlyNeeded)
		Flags \|= Linker::Flags::LinkOnlyNeeded;

// First add all the regular input files		// First add all the regular input files
if (!linkFiles(argv[0], Context, L, InputFilenames, false))		if (!linkFiles(argv[0], Context, L, InputFilenames, Flags))
return 1;		return 1;

// Next the -override ones.		// Next the -override ones.
if (!linkFiles(argv[0], Context, L, OverridingInputs, true))		if (!linkFiles(argv[0], Context, L, OverridingInputs,
		Flags \| Linker::Flags::OverrideFromSrc))
return 1;		return 1;

if (DumpAsm) errs() << "Here's the assembly:\n" << *Composite;		if (DumpAsm) errs() << "Here's the assembly:\n" << *Composite;

std::error_code EC;		std::error_code EC;
tool_output_file Out(OutputFilename, EC, sys::fs::F_None);		tool_output_file Out(OutputFilename, EC, sys::fs::F_None);
if (EC) {		if (EC) {
errs() << EC.message() << '\n';		errs() << EC.message() << '\n';
Show All 19 Lines

This is an archive of the discontinued LLVM Phabricator instance.

Implement selective bitcode linking and internalization of linked symbols · Closed · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 33711

llvm/trunk/include/llvm/Linker/Linker.h

llvm/trunk/lib/Linker/LinkModules.cpp

llvm/trunk/test/Linker/Inputs/linkage.c.ll

llvm/trunk/test/Linker/link-flags.ll

llvm/trunk/tools/llvm-link/llvm-link.cpp

Implement selective bitcode linking and internalization of linked symbols
ClosedPublic