Diff 129479

wasm/InputChunks.h

Show First 20 Lines • Show All 124 Lines • ▼ Show 20 Lines	public:
uint32_t getOutputIndex() const { return OutputIndex.getValue(); };		uint32_t getOutputIndex() const { return OutputIndex.getValue(); };
bool hasOutputIndex() const { return OutputIndex.hasValue(); };		bool hasOutputIndex() const { return OutputIndex.hasValue(); };
void setOutputIndex(uint32_t Index) {		void setOutputIndex(uint32_t Index) {
assert(!hasOutputIndex());		assert(!hasOutputIndex());
OutputIndex = Index;		OutputIndex = Index;
};		};

const WasmSignature &Signature;		const WasmSignature &Signature;
		const WasmFunction &Function;

protected:		protected:
uint32_t getInputSectionOffset() const override {		uint32_t getInputSectionOffset() const override {
return Function.CodeSectionOffset;		return Function.CodeSectionOffset;
}		}
const WasmFunction &Function;
llvm::Optional<uint32_t> OutputIndex;		llvm::Optional<uint32_t> OutputIndex;
};		};

} // namespace wasm		} // namespace wasm
} // namespace lld		} // namespace lld

#endif // LLD_WASM_INPUT_CHUNKS_H		#endif // LLD_WASM_INPUT_CHUNKS_H

wasm/InputChunks.cpp

Show First 20 Lines • Show All 101 Lines • ▼ Show 20 Lines	for (const WasmRelocation &Reloc : Relocations) {
DEBUG(dbgs() << "reloc: type=" << Reloc.Type << " index=" << Reloc.Index		DEBUG(dbgs() << "reloc: type=" << Reloc.Type << " index=" << Reloc.Index
<< " offset=" << Reloc.Offset		<< " offset=" << Reloc.Offset
<< " newOffset=" << NewReloc.Reloc.Offset << "\n");		<< " newOffset=" << NewReloc.Reloc.Offset << "\n");

if (Config->EmitRelocs)		if (Config->EmitRelocs)
NewReloc.NewIndex = File.calcNewIndex(Reloc);		NewReloc.NewIndex = File.calcNewIndex(Reloc);

switch (Reloc.Type) {		switch (Reloc.Type) {
		case R_WEBASSEMBLY_TABLE_INDEX_I32:
		case R_WEBASSEMBLY_TABLE_INDEX_SLEB:
		NewReloc.Value = File.relocateTableIndex(Reloc.Index);
		break;
case R_WEBASSEMBLY_MEMORY_ADDR_SLEB:		case R_WEBASSEMBLY_MEMORY_ADDR_SLEB:
case R_WEBASSEMBLY_MEMORY_ADDR_I32:		case R_WEBASSEMBLY_MEMORY_ADDR_I32:
case R_WEBASSEMBLY_MEMORY_ADDR_LEB:		case R_WEBASSEMBLY_MEMORY_ADDR_LEB:
NewReloc.Value = File.getRelocatedAddress(Reloc.Index) + Reloc.Addend;		NewReloc.Value = File.getRelocatedAddress(Reloc.Index) + Reloc.Addend;
break;		break;
default:		default:
NewReloc.Value = File.calcNewIndex(Reloc);		NewReloc.Value = File.calcNewIndex(Reloc);
break;		break;
}		}

OutRelocations.emplace_back(NewReloc);		OutRelocations.emplace_back(NewReloc);
}		}
}		}

wasm/InputFiles.h

Show First 20 Lines • Show All 87 Lines • ▼ Show 20 Lines	public:

void parse() override;		void parse() override;

// Returns the underlying wasm file.		// Returns the underlying wasm file.
const WasmObjectFile *getWasmObj() const { return WasmObj.get(); }		const WasmObjectFile *getWasmObj() const { return WasmObj.get(); }

void dumpInfo() const;		void dumpInfo() const;

uint32_t relocateFunctionIndex(uint32_t Original) const;		uint32_t relocateFunctionSymbolIndex(uint32_t Original) const;
uint32_t getRelocatedAddress(uint32_t Index) const;		uint32_t getRelocatedAddress(uint32_t Index) const;
uint32_t calcNewIndex(const WasmRelocation &Reloc) const;		uint32_t calcNewIndex(const WasmRelocation &Reloc) const;

const WasmSection *CodeSection = nullptr;		const WasmSection *CodeSection = nullptr;
const WasmSection *DataSection = nullptr;		const WasmSection *DataSection = nullptr;

std::vector<uint32_t> TypeMap;		std::vector<uint32_t> TypeMap;
std::vector<InputSegment *> Segments;		std::vector<InputSegment *> Segments;
std::vector<InputFunction *> Functions;		std::vector<InputFunction *> Functions;

ArrayRef<Symbol *> getSymbols() { return Symbols; }		ArrayRef<Symbol *> getSymbols() const { return Symbols; }
ArrayRef<Symbol *> getTableSymbols() { return TableSymbols; }		ArrayRef<Symbol *> getFunctionSymbols() const { return FunctionSymbols; }

private:		private:
uint32_t relocateTypeIndex(uint32_t Original) const;		uint32_t relocateTypeIndex(uint32_t Original) const;
uint32_t relocateGlobalIndex(uint32_t Original) const;		uint32_t relocateGlobalSymbolIndex(uint32_t Original) const;
uint32_t relocateTableIndex(uint32_t Original) const;		uint32_t relocateTableIndex(uint32_t Original) const;

Symbol *createDefined(const WasmSymbol &Sym, Symbol::Kind Kind,		Symbol *createDefined(const WasmSymbol &Sym, Symbol::Kind Kind,
const InputSegment *Segment = nullptr,		const InputSegment *Segment = nullptr,
InputFunction *Function = nullptr,		InputFunction *Function = nullptr,
uint32_t Address = UINT32_MAX);		uint32_t Address = UINT32_MAX);
Symbol *createUndefined(const WasmSymbol &Sym, Symbol::Kind Kind,		Symbol *createUndefined(const WasmSymbol &Sym, Symbol::Kind Kind,
const WasmSignature *Signature = nullptr);		const WasmSignature *Signature = nullptr);
void initializeSymbols();		void initializeSymbols();
InputSegment *getSegment(const WasmSymbol &WasmSym) const;		InputSegment *getSegment(const WasmSymbol &WasmSym) const;
const WasmSignature *getFunctionSig(const WasmSymbol &Sym) const;		const WasmSignature *getFunctionSig(const WasmSymbol &Sym) const;
uint32_t getGlobalValue(const WasmSymbol &Sym) const;		uint32_t getGlobalValue(const WasmSymbol &Sym) const;
InputFunction *getFunction(const WasmSymbol &Sym) const;		InputFunction *getFunction(const WasmSymbol &Sym) const;
bool isExcludedByComdat(InputChunk *Chunk) const;		bool isExcludedByComdat(InputChunk *Chunk) const;

// List of all symbols referenced or defined by this file.		// List of all symbols referenced or defined by this file.
std::vector<Symbol *> Symbols;		std::vector<Symbol *> Symbols;

// List of all function symbols indexed by the function index space		// List of all function symbols indexed by the function Symbol index space,
		// that is, function imports followed by function exports (not the Wasm
		// function definition index space, function imports followed by function
		// bodies).
std::vector<Symbol *> FunctionSymbols;		std::vector<Symbol *> FunctionSymbols;

// List of all global symbols indexed by the global index space		// List of all global symbols indexed by the global Symbol index space,
		// that is, global imports followed by global exports (not the Wasm
		// global definition index space, global imports followed by global
		// definitions).
std::vector<Symbol *> GlobalSymbols;		std::vector<Symbol *> GlobalSymbols;

// List of all indirect symbols indexed by table index space.
std::vector<Symbol *> TableSymbols;

uint32_t NumGlobalImports = 0;		uint32_t NumGlobalImports = 0;
uint32_t NumFunctionImports = 0;		uint32_t NumFunctionImports = 0;
		uint32_t NumGlobalExports = 0;
		uint32_t NumFunctionExports = 0;
std::unique_ptr<WasmObjectFile> WasmObj;		std::unique_ptr<WasmObjectFile> WasmObj;
};		};

// Opens a given file.		// Opens a given file.
llvm::Optional<MemoryBufferRef> readFile(StringRef Path);		llvm::Optional<MemoryBufferRef> readFile(StringRef Path);

} // namespace wasm		} // namespace wasm

std::string toString(const wasm::InputFile *File);		std::string toString(const wasm::InputFile *File);

} // namespace lld		} // namespace lld

#endif		#endif

wasm/InputFiles.cpp

Show First 20 Lines • Show All 41 Lines • ▼ Show 20 Lines	Optional<MemoryBufferRef> lld::wasm::readFile(StringRef Path) {
return MBRef;		return MBRef;
}		}

void ObjFile::dumpInfo() const {		void ObjFile::dumpInfo() const {
log("info for: " + getName() + "\n" +		log("info for: " + getName() + "\n" +
" Total Functions : " + Twine(FunctionSymbols.size()) + "\n" +		" Total Functions : " + Twine(FunctionSymbols.size()) + "\n" +
" Total Globals : " + Twine(GlobalSymbols.size()) + "\n" +		" Total Globals : " + Twine(GlobalSymbols.size()) + "\n" +
" Function Imports : " + Twine(NumFunctionImports) + "\n" +		" Function Imports : " + Twine(NumFunctionImports) + "\n" +
" Global Imports : " + Twine(NumGlobalImports) + "\n" +		" Global Imports : " + Twine(NumGlobalImports) + "\n");
" Table Entries : " + Twine(TableSymbols.size()) + "\n");
}		}

uint32_t ObjFile::getRelocatedAddress(uint32_t GlobalIndex) const {		uint32_t ObjFile::getRelocatedAddress(uint32_t GlobalIndex) const {
return GlobalSymbols[GlobalIndex]->getVirtualAddress();		return GlobalSymbols[GlobalIndex]->getVirtualAddress();
}		}

uint32_t ObjFile::relocateFunctionIndex(uint32_t Original) const {		uint32_t ObjFile::relocateTypeIndex(uint32_t Original) const {
		return TypeMap[Original];
		}

		uint32_t ObjFile::relocateFunctionSymbolIndex(uint32_t Original) const {
Symbol *Sym = FunctionSymbols[Original];		Symbol *Sym = FunctionSymbols[Original];
uint32_t Index = Sym->getOutputIndex();		uint32_t Index = Sym->getOutputIndex();
DEBUG(dbgs() << "relocateFunctionIndex: " << toString(*Sym) << ": "		DEBUG(dbgs() << "relocateFunctionSymbolIndex: " << toString(*Sym) << ": "
<< Original << " -> " << Index << "\n");		<< Original << " -> " << Index << "\n");
return Index;		return Index;
}		}

uint32_t ObjFile::relocateTypeIndex(uint32_t Original) const {		uint32_t ObjFile::relocateGlobalSymbolIndex(uint32_t Original) const {
return TypeMap[Original];		Symbol *Sym = GlobalSymbols[Original];
		uint32_t Index = Sym->hasOutputIndex() ? Sym->getOutputIndex() : 0;
		DEBUG(dbgs() << "relocateGlobalSymbolIndex: " << toString(*Sym) << ": " << Original
		<< " -> " << Index << "\n");
		return Index;
}		}

uint32_t ObjFile::relocateTableIndex(uint32_t Original) const {		uint32_t ObjFile::relocateTableIndex(uint32_t Original) const {
Symbol *Sym = TableSymbols[Original];		Symbol *Sym = FunctionSymbols[Original];
uint32_t Index = Sym->hasTableIndex() ? Sym->getTableIndex() : 0;		uint32_t Index = Sym->hasTableIndex() ? Sym->getTableIndex() : 0;
DEBUG(dbgs() << "relocateTableIndex: " << toString(*Sym) << ": " << Original		DEBUG(dbgs() << "relocateTableIndex: " << toString(*Sym) << ": " << Original
<< " -> " << Index << "\n");		<< " -> " << Index << "\n");
return Index;		return Index;
}		}

uint32_t ObjFile::relocateGlobalIndex(uint32_t Original) const {
Symbol *Sym = GlobalSymbols[Original];
uint32_t Index = Sym->hasOutputIndex() ? Sym->getOutputIndex() : 0;
DEBUG(dbgs() << "relocateGlobalIndex: " << toString(*Sym) << ": " << Original
<< " -> " << Index << "\n");
return Index;
}

// Relocations contain an index into the function, global or table index		// Relocations contain an index into the function, global or table index
// space of the input file. This function takes a relocation and returns the		// space of the input file. This function takes a relocation and returns the
// relocated index (i.e. translates from the input index space to the output		// relocated index (i.e. translates from the input index space to the output
// index space).		// index space).
uint32_t ObjFile::calcNewIndex(const WasmRelocation &Reloc) const {		uint32_t ObjFile::calcNewIndex(const WasmRelocation &Reloc) const {
switch (Reloc.Type) {		switch (Reloc.Type) {
case R_WEBASSEMBLY_TYPE_INDEX_LEB:		case R_WEBASSEMBLY_TYPE_INDEX_LEB:
return relocateTypeIndex(Reloc.Index);		return relocateTypeIndex(Reloc.Index);
case R_WEBASSEMBLY_FUNCTION_INDEX_LEB:		case R_WEBASSEMBLY_FUNCTION_INDEX_LEB:
return relocateFunctionIndex(Reloc.Index);
case R_WEBASSEMBLY_TABLE_INDEX_I32:		case R_WEBASSEMBLY_TABLE_INDEX_I32:
case R_WEBASSEMBLY_TABLE_INDEX_SLEB:		case R_WEBASSEMBLY_TABLE_INDEX_SLEB:
return relocateTableIndex(Reloc.Index);		return relocateFunctionSymbolIndex(Reloc.Index);
case R_WEBASSEMBLY_GLOBAL_INDEX_LEB:		case R_WEBASSEMBLY_GLOBAL_INDEX_LEB:
case R_WEBASSEMBLY_MEMORY_ADDR_LEB:		case R_WEBASSEMBLY_MEMORY_ADDR_LEB:
case R_WEBASSEMBLY_MEMORY_ADDR_SLEB:		case R_WEBASSEMBLY_MEMORY_ADDR_SLEB:
case R_WEBASSEMBLY_MEMORY_ADDR_I32:		case R_WEBASSEMBLY_MEMORY_ADDR_I32:
return relocateGlobalIndex(Reloc.Index);		return relocateGlobalSymbolIndex(Reloc.Index);
default:		default:
llvm_unreachable("unknown relocation type");		llvm_unreachable("unknown relocation type");
}		}
}		}

void ObjFile::parse() {		void ObjFile::parse() {
// Parse a memory buffer as a wasm file.		// Parse a memory buffer as a wasm file.
DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n");		DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n");
Show All 34 Lines	InputSegment *ObjFile::getSegment(const WasmSymbol &WasmSym) const {
}		}
error("symbol not found in any segment: " + WasmSym.Name);		error("symbol not found in any segment: " + WasmSym.Name);
return nullptr;		return nullptr;
}		}

// Get the value stored in the wasm global represented by this symbol.		// Get the value stored in the wasm global represented by this symbol.
// This represents the virtual address of the symbol in the input file.		// This represents the virtual address of the symbol in the input file.
uint32_t ObjFile::getGlobalValue(const WasmSymbol &Sym) const {		uint32_t ObjFile::getGlobalValue(const WasmSymbol &Sym) const {
		assert(Sym.WasmIndex >= getWasmObj()->getNumImportedGlobals());
const WasmGlobal &Global =		const WasmGlobal &Global =
getWasmObj()->globals()[Sym.ElementIndex - NumGlobalImports];		getWasmObj()->globals()[Sym.WasmIndex - NumGlobalImports];
assert(Global.Type == llvm::wasm::WASM_TYPE_I32);		assert(Global.Type == llvm::wasm::WASM_TYPE_I32);
return Global.InitExpr.Value.Int32;		return Global.InitExpr.Value.Int32;
}		}

// Get the signature for a given function symbol, either by looking		// Get the signature for a given function symbol, either by looking
// it up in function sections (for defined functions), of the imports section		// it up in function sections (for defined functions), of the imports section
// (for imported functions).		// (for imported functions).
const WasmSignature *ObjFile::getFunctionSig(const WasmSymbol &Sym) const {		const WasmSignature *ObjFile::getFunctionSig(const WasmSymbol &Sym) const {
DEBUG(dbgs() << "getFunctionSig: " << Sym.Name << "\n");		DEBUG(dbgs() << "getFunctionSig: " << Sym.Name << "\n");
return &WasmObj->types()[Sym.FunctionType];		return &WasmObj->types()[Sym.FunctionType];
}		}

InputFunction *ObjFile::getFunction(const WasmSymbol &Sym) const {		InputFunction *ObjFile::getFunction(const WasmSymbol &Sym) const {
uint32_t FunctionIndex = Sym.ElementIndex - NumFunctionImports;		assert(Sym.WasmIndex >= NumFunctionImports);
		uint32_t FunctionIndex = Sym.WasmIndex - NumFunctionImports;
return Functions[FunctionIndex];		return Functions[FunctionIndex];
}		}

bool ObjFile::isExcludedByComdat(InputChunk *Chunk) const {		bool ObjFile::isExcludedByComdat(InputChunk *Chunk) const {
StringRef Comdat = Chunk->getComdat();		StringRef Comdat = Chunk->getComdat();
return !Comdat.empty() && Symtab->findComdat(Comdat) != this;		return !Comdat.empty() && Symtab->findComdat(Comdat) != this;
}		}

void ObjFile::initializeSymbols() {		void ObjFile::initializeSymbols() {
Symbols.reserve(WasmObj->getNumberOfSymbols());		Symbols.reserve(WasmObj->getNumberOfSymbols());

for (const WasmImport &Import : WasmObj->imports()) {		NumFunctionImports = WasmObj->getNumImportedFunctions();
switch (Import.Kind) {		NumGlobalImports = WasmObj->getNumImportedGlobals();
case WASM_EXTERNAL_FUNCTION:		NumFunctionExports = WasmObj->getNumExportedFunctions();
++NumFunctionImports;		NumGlobalExports = WasmObj->getNumExportedGlobals();
break;
case WASM_EXTERNAL_GLOBAL:
++NumGlobalImports;
break;
}
}

ArrayRef<WasmFunction> Funcs = WasmObj->functions();		ArrayRef<WasmFunction> Funcs = WasmObj->functions();
ArrayRef<uint32_t> FuncTypes = WasmObj->functionTypes();		ArrayRef<uint32_t> FuncTypes = WasmObj->functionTypes();
ArrayRef<WasmSignature> Types = WasmObj->types();		ArrayRef<WasmSignature> Types = WasmObj->types();
ArrayRef<WasmGlobal> Globals = WasmObj->globals();		ArrayRef<WasmGlobal> Globals = WasmObj->globals();

for (const auto &C : WasmObj->comdats())		for (const auto &C : WasmObj->comdats())
Symtab->addComdat(C, this);		Symtab->addComdat(C, this);
▲ Show 20 Lines • Show All 45 Lines • ▼ Show 20 Lines	case WasmSymbol::SymbolType::GLOBAL_EXPORT: {
} else {		} else {
Segment->Discarded = true;		Segment->Discarded = true;
// fall through:		// fall through:
}		}
}		}
case WasmSymbol::SymbolType::GLOBAL_IMPORT:		case WasmSymbol::SymbolType::GLOBAL_IMPORT:
S = createUndefined(WasmSym, Symbol::Kind::UndefinedGlobalKind);		S = createUndefined(WasmSym, Symbol::Kind::UndefinedGlobalKind);
break;		break;
case WasmSymbol::SymbolType::DEBUG_FUNCTION_NAME:
// These are for debugging only, no need to create linker symbols for them
continue;
}		}

Symbols.push_back(S);		Symbols.push_back(S);
if (WasmSym.isFunction()) {		if (WasmSym.isFunction()) {
DEBUG(dbgs() << "Function: " << WasmSym.ElementIndex << " -> "		DEBUG(dbgs() << "Function: " << WasmSym.SymbolIndex << " -> "
<< toString(*S) << "\n");		<< toString(*S) << "\n");
FunctionSymbols[WasmSym.ElementIndex] = S;		FunctionSymbols[WasmSym.SymbolIndex] = S;
if (WasmSym.HasAltIndex)		InputFunction &Func = *Functions[WasmSym.WasmIndex - NumFunctionImports];
FunctionSymbols[WasmSym.AltIndex] = S;
} else {		} else {
DEBUG(dbgs() << "Global: " << WasmSym.ElementIndex << " -> "		DEBUG(dbgs() << "Global: " << WasmSym.SymbolIndex << " -> "
<< toString(*S) << "\n");		<< toString(*S) << "\n");
GlobalSymbols[WasmSym.ElementIndex] = S;		GlobalSymbols[WasmSym.SymbolIndex] = S;
if (WasmSym.HasAltIndex)
GlobalSymbols[WasmSym.AltIndex] = S;
}		}
}		}

DEBUG(for (size_t I = 0; I < FunctionSymbols.size(); ++I)		DEBUG(for (size_t I = 0; I < FunctionSymbols.size(); ++I)
assert(FunctionSymbols[I] != nullptr);		assert(FunctionSymbols[I] != nullptr);
for (size_t I = 0; I < GlobalSymbols.size(); ++I)		for (size_t I = 0; I < GlobalSymbols.size(); ++I)
assert(GlobalSymbols[I] != nullptr););		assert(GlobalSymbols[I] != nullptr););

// Populate `TableSymbols` with all symbols that are called indirectly
uint32_t SegmentCount = WasmObj->elements().size();
if (SegmentCount) {
if (SegmentCount > 1)
fatal(getName() + ": contains more than one element segment");
const WasmElemSegment &Segment = WasmObj->elements()[0];
if (Segment.Offset.Opcode != WASM_OPCODE_I32_CONST)
fatal(getName() + ": unsupported element segment");
if (Segment.TableIndex != 0)
fatal(getName() + ": unsupported table index in elem segment");
if (Segment.Offset.Value.Int32 != 0)
fatal(getName() + ": unsupported element segment offset");
TableSymbols.reserve(Segment.Functions.size());
for (uint64_t FunctionIndex : Segment.Functions)
TableSymbols.push_back(FunctionSymbols[FunctionIndex]);
}

DEBUG(dbgs() << "TableSymbols: " << TableSymbols.size() << "\n");
DEBUG(dbgs() << "Functions : " << FunctionSymbols.size() << "\n");		DEBUG(dbgs() << "Functions : " << FunctionSymbols.size() << "\n");
DEBUG(dbgs() << "Globals : " << GlobalSymbols.size() << "\n");		DEBUG(dbgs() << "Globals : " << GlobalSymbols.size() << "\n");
}		}

Symbol *ObjFile::createUndefined(const WasmSymbol &Sym, Symbol::Kind Kind,		Symbol *ObjFile::createUndefined(const WasmSymbol &Sym, Symbol::Kind Kind,
const WasmSignature *Signature) {		const WasmSignature *Signature) {
return Symtab->addUndefined(Sym.Name, Kind, Sym.Flags, this, Signature);		return Symtab->addUndefined(Sym.Name, Kind, Sym.Flags, this, Signature);
}		}
▲ Show 20 Lines • Show All 66 Lines • Show Last 20 Lines

wasm/Symbols.h

Show All 33 Lines	enum Kind {
UndefinedFunctionKind,		UndefinedFunctionKind,
UndefinedGlobalKind,		UndefinedGlobalKind,

LastDefinedKind = DefinedGlobalKind,		LastDefinedKind = DefinedGlobalKind,
InvalidKind,		InvalidKind,
};		};

Symbol(StringRef Name, uint32_t Flags)		Symbol(StringRef Name, uint32_t Flags)
: WrittenToSymtab(0), WrittenToNameSec(0), Flags(Flags), Name(Name) {}		: Flags(Flags), Name(Name) {}

Kind getKind() const { return SymbolKind; }		Kind getKind() const { return SymbolKind; }

bool isLazy() const { return SymbolKind == LazyKind; }		bool isLazy() const { return SymbolKind == LazyKind; }
bool isDefined() const { return SymbolKind <= LastDefinedKind; }		bool isDefined() const { return SymbolKind <= LastDefinedKind; }
bool isUndefined() const {		bool isUndefined() const {
return SymbolKind == UndefinedGlobalKind \|\|		return SymbolKind == UndefinedGlobalKind \|\|
SymbolKind == UndefinedFunctionKind;		SymbolKind == UndefinedFunctionKind;
Show All 17 Lines	public:
const WasmSignature &getFunctionType() const;		const WasmSignature &getFunctionType() const;
void setFunctionType(const WasmSignature *Type);		void setFunctionType(const WasmSignature *Type);

uint32_t getOutputIndex() const;		uint32_t getOutputIndex() const;

// Returns true if an output index has been set for this symbol		// Returns true if an output index has been set for this symbol
bool hasOutputIndex() const;		bool hasOutputIndex() const;

// Set the output index of the symbol (in the function or global index		// Set the output index of the symbol, in the function or global Wasm
// space of the output object.		// index space of the output object - that is, for defined symbols only,
		// its position in the list of defined function bodies / global decls.
void setOutputIndex(uint32_t Index);		void setOutputIndex(uint32_t Index);

uint32_t getTableIndex() const { return TableIndex.getValue(); }		uint32_t getTableIndex() const { return TableIndex.getValue(); }

// Returns true if a table index has been set for this symbol		// Returns true if a table index has been set for this symbol
bool hasTableIndex() const { return TableIndex.hasValue(); }		bool hasTableIndex() const { return TableIndex.hasValue(); }

// Set the table index of the symbol		// Set the table index of the symbol
void setTableIndex(uint32_t Index);		void setTableIndex(uint32_t Index);

// Returns the virtual address of a defined global.		// Returns the virtual address of a defined global.
// Only works for globals, not functions.		// Only works for globals, not functions.
uint32_t getVirtualAddress() const;		uint32_t getVirtualAddress() const;

void setVirtualAddress(uint32_t VA);		void setVirtualAddress(uint32_t VA);

void update(Kind K, InputFile *F = nullptr, uint32_t Flags = 0,		void update(Kind K, InputFile *F = nullptr, uint32_t Flags = 0,
const InputSegment *Segment = nullptr,		const InputSegment *Segment = nullptr,
const InputFunction *Function = nullptr,		const InputFunction *Function = nullptr,
uint32_t Address = UINT32_MAX);		uint32_t Address = UINT32_MAX);

void setArchiveSymbol(const Archive::Symbol &Sym) { ArchiveSymbol = Sym; }		void setArchiveSymbol(const Archive::Symbol &Sym) { ArchiveSymbol = Sym; }
const Archive::Symbol &getArchiveSymbol() { return ArchiveSymbol; }		const Archive::Symbol &getArchiveSymbol() { return ArchiveSymbol; }

// This bit is used by Writer::writeNameSection() to prevent
// symbols from being written to the symbol table more than once.
unsigned WrittenToSymtab : 1;
unsigned WrittenToNameSec : 1;

protected:		protected:
uint32_t Flags;		uint32_t Flags;
uint32_t VirtualAddress = 0;		uint32_t VirtualAddress = 0;

StringRef Name;		StringRef Name;
Archive::Symbol ArchiveSymbol = {nullptr, 0, 0};		Archive::Symbol ArchiveSymbol = {nullptr, 0, 0};
Kind SymbolKind = InvalidKind;		Kind SymbolKind = InvalidKind;
InputFile *File = nullptr;		InputFile *File = nullptr;
Show All 16 Lines

wasm/Writer.cpp

Show First 20 Lines • Show All 67 Lines • ▼ Show 20 Lines

private:		private:
void openFile();		void openFile();

uint32_t lookupType(const WasmSignature &Sig);		uint32_t lookupType(const WasmSignature &Sig);
uint32_t registerType(const WasmSignature &Sig);		uint32_t registerType(const WasmSignature &Sig);
void assignIndexes();		void assignIndexes();
void calculateImports();		void calculateImports();
void calculateOffsets();
void calculateTypes();		void calculateTypes();
void createOutputSegments();		void createOutputSegments();
void layoutMemory();		void layoutMemory();
void createHeader();		void createHeader();
void createSections();		void createSections();
SyntheticSection *createSyntheticSection(uint32_t Type,		SyntheticSection *createSyntheticSection(uint32_t Type,
StringRef Name = "");		StringRef Name = "");

Show All 16 Lines	private:
void createNameSection();		void createNameSection();

void writeHeader();		void writeHeader();
void writeSections();		void writeSections();

uint64_t FileSize = 0;		uint64_t FileSize = 0;
uint32_t DataSize = 0;		uint32_t DataSize = 0;
uint32_t NumMemoryPages = 0;		uint32_t NumMemoryPages = 0;
uint32_t InitialTableOffset = 0;		uint32_t InitialTableOffset = 1;

std::vector<const WasmSignature *> Types;		std::vector<const WasmSignature *> Types;
DenseMap<WasmSignature, int32_t, WasmSignatureDenseMapInfo> TypeIndices;		DenseMap<WasmSignature, int32_t, WasmSignatureDenseMapInfo> TypeIndices;
std::vector<const Symbol *> ImportedFunctions;		std::vector<const Symbol *> ImportedFunctions;
std::vector<const Symbol *> ImportedGlobals;		std::vector<const Symbol *> ImportedGlobals;
std::vector<const Symbol *> DefinedGlobals;		std::vector<const Symbol *> DefinedGlobals;
std::vector<InputFunction *> DefinedFunctions;		std::vector<InputFunction *> DefinedFunctions;
std::vector<const Symbol *> IndirectFunctions;		std::vector<const Symbol *> IndirectFunctions;
▲ Show 20 Lines • Show All 294 Lines • ▼ Show 20 Lines	void Writer::createLinkingSection() {
}		}

std::vector<WasmInitFunc> InitFunctions;		std::vector<WasmInitFunc> InitFunctions;
for (ObjFile *File : Symtab->ObjectFiles) {		for (ObjFile *File : Symtab->ObjectFiles) {
const WasmLinkingData &L = File->getWasmObj()->linkingData();		const WasmLinkingData &L = File->getWasmObj()->linkingData();
InitFunctions.reserve(InitFunctions.size() + L.InitFunctions.size());		InitFunctions.reserve(InitFunctions.size() + L.InitFunctions.size());
for (const WasmInitFunc &F : L.InitFunctions)		for (const WasmInitFunc &F : L.InitFunctions)
InitFunctions.emplace_back(WasmInitFunc{		InitFunctions.emplace_back(WasmInitFunc{
F.Priority, File->relocateFunctionIndex(F.FunctionIndex)});		F.Priority, File->relocateFunctionSymbolIndex(F.FunctionIndex)});
}		}

if (!InitFunctions.empty()) {		if (!InitFunctions.empty()) {
SubSection SubSection(WASM_INIT_FUNCS);		SubSection SubSection(WASM_INIT_FUNCS);
writeUleb128(SubSection.getStream(), InitFunctions.size(),		writeUleb128(SubSection.getStream(), InitFunctions.size(),
"num init functionsw");		"num init functions");
for (const WasmInitFunc &F : InitFunctions) {		for (const WasmInitFunc &F : InitFunctions) {
writeUleb128(SubSection.getStream(), F.Priority, "priority");		writeUleb128(SubSection.getStream(), F.Priority, "priority");
writeUleb128(SubSection.getStream(), F.FunctionIndex, "function index");		writeUleb128(SubSection.getStream(), F.FunctionIndex, "function index");
}		}
SubSection.finalizeContents();		SubSection.finalizeContents();
SubSection.writeToStream(OS);		SubSection.writeToStream(OS);
}		}

Show All 31 Lines	if (!Comdats.empty()) {
}		}
SubSection.finalizeContents();		SubSection.finalizeContents();
SubSection.writeToStream(OS);		SubSection.writeToStream(OS);
}		}
}		}

// Create the custom "name" section containing debug symbol names.		// Create the custom "name" section containing debug symbol names.
void Writer::createNameSection() {		void Writer::createNameSection() {
// Create an array of all function sorted by function index space		unsigned Names = 0;
std::vector<const Symbol *> Names;		for (const InputFunction *F : DefinedFunctions)
		if (!F->Function.Name.empty())
for (ObjFile *File : Symtab->ObjectFiles) {		++Names;
Names.reserve(Names.size() + File->getSymbols().size());
for (Symbol *S : File->getSymbols()) {
if (!S->isFunction() \|\| S->isWeak() \|\| S->WrittenToNameSec)
continue;
S->WrittenToNameSec = true;
Names.emplace_back(S);
}
}

SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, "name");		SyntheticSection *Section = createSyntheticSection(WASM_SEC_CUSTOM, "name");

std::sort(Names.begin(), Names.end(), [](const Symbol A, const Symbol B) {
return A->getOutputIndex() < B->getOutputIndex();
});

SubSection FunctionSubsection(WASM_NAMES_FUNCTION);		SubSection FunctionSubsection(WASM_NAMES_FUNCTION);
raw_ostream &OS = FunctionSubsection.getStream();		raw_ostream &OS = FunctionSubsection.getStream();
writeUleb128(OS, Names.size(), "name count");		writeUleb128(OS, Names, "name count");

// We have to iterate through the inputs twice so that all the imports		for (const InputFunction *F : DefinedFunctions) {
// appear first before any of the local function names.		if (!F->Function.Name.empty()) {
for (const Symbol *S : Names) {		writeUleb128(OS, F->getOutputIndex(), "func index");
writeUleb128(OS, S->getOutputIndex(), "func index");		writeStr(OS, F->Function.Name, "symbol name");
writeStr(OS, S->getName(), "symbol name");		}
}		}

FunctionSubsection.finalizeContents();		FunctionSubsection.finalizeContents();
FunctionSubsection.writeToStream(Section->getStream());		FunctionSubsection.writeToStream(Section->getStream());
}		}

void Writer::writeHeader() {		void Writer::writeHeader() {
memcpy(Buffer->getBufferStart(), Header.data(), Header.size());		memcpy(Buffer->getBufferStart(), Header.data(), Header.size());
▲ Show 20 Lines • Show All 92 Lines • ▼ Show 20 Lines	if (Sym->isFunction()) {
ImportedFunctions.push_back(Sym);		ImportedFunctions.push_back(Sym);
} else {		} else {
Sym->setOutputIndex(ImportedGlobals.size());		Sym->setOutputIndex(ImportedGlobals.size());
ImportedGlobals.push_back(Sym);		ImportedGlobals.push_back(Sym);
}		}
}		}
}		}

uint32_t Writer::lookupType(const WasmSignature &Sig) {		uint32_t Writer::lookupType(const WasmSignature &Sig) {
auto It = TypeIndices.find(Sig);		auto It = TypeIndices.find(Sig);
if (It == TypeIndices.end()) {		if (It == TypeIndices.end()) {
error("type not found: " + toString(Sig));		error("type not found: " + toString(Sig));
return 0;		return 0;
}		}
return It->second;		return It->second;
}		}

uint32_t Writer::registerType(const WasmSignature &Sig) {		uint32_t Writer::registerType(const WasmSignature &Sig) {
auto Pair = TypeIndices.insert(std::make_pair(Sig, Types.size()));		auto Pair = TypeIndices.insert(std::make_pair(Sig, Types.size()));
if (Pair.second) {		if (Pair.second) {
DEBUG(dbgs() << "type " << toString(Sig) << "\n");		DEBUG(dbgs() << "type " << toString(Sig) << "\n");
Types.push_back(&Sig);		Types.push_back(&Sig);
}		}
return Pair.first->second;		return Pair.first->second;
}		}

void Writer::calculateTypes() {		void Writer::calculateTypes() {
for (ObjFile *File : Symtab->ObjectFiles) {		for (ObjFile *File : Symtab->ObjectFiles) {
File->TypeMap.reserve(File->getWasmObj()->types().size());		File->TypeMap.reserve(File->getWasmObj()->types().size());
for (const WasmSignature &Sig : File->getWasmObj()->types())		for (const WasmSignature &Sig : File->getWasmObj()->types())
File->TypeMap.push_back(registerType(Sig));		File->TypeMap.push_back(registerType(Sig));
}		}
}		}
		ruiu (Unsubmitted, Not Done) Reply Inline Actions: This is not related to this particular patch, but since I found this in this patch, I'll write the comment here. This piece of code is alarming because it uses hash tables. In general, in lld, I'd strongly recommend not using hash tables or anything more complicated than a vector, because hash tables can make the linker noticeably slower. If you really need to use a hash table, please look it up only once for a new piece of data, just like we do in the SymbolTable. In SymbolTable, we look up a new symbol name in the hash table only once to obtain a pointer, and after that, we access the symbols through the pointer. We never look up the symbol table more than once for the same data, to minimize the cost of hash table lookups. I designed everything in lld that way, and that is, I believe, one of the big reasons why lld is so fast. I'm not sure if it is applicable to this piece of code. If you have a small number of types and look up the hash table only a few times, that's perhaps fine. But if each function has a type, and you need to insert into/look up a hash table for each function, that's too much. If that's the case, could you revisit this code and redesign it? ruiu: This is not related to this particular patch, but since I found this in this patch, I'll write…
		sbc100 (Unsubmitted, Not Done) Reply Inline Actions: Yes, I think we can eliminate lookupType completely once the symbol table changes land. We can just have the TypeIndex from each symbol as we call registerType. sbc100: Yes, I think we can eliminate lookupType completely once the symbol table changes land. We…
		ncw (Author, Unsubmitted, Not Done) Reply Inline Actions: In fact I remember making the same change in WasmObjectWriter (then reverting it), using a vector of bool to store whether something had been allocated rather than a DenseMap. In LLD there are a few hash map lookups we've added, I'm afraid :( In fact COMDAT is another one; I think I can get rid of the hash map LLD uses for that as well. That was my fault, before I realised hash maps were forbidden. ncw: In fact I remember making the same change in WasmObjectWriter (then reverting it), using a…
		ruiu (Unsubmitted, Not Done) Reply Inline Actions: It's not forbidden. :) For example, SymbolTable is a valid use of a hash table -- I can't think of any way to avoid a hash table in that class. But it is strongly discouraged because it sometimes has a significant performance impact. ruiu: It's not forbidden. :) For example SymbolTable is a valid use of the hash table -- I can't…

void Writer::assignIndexes() {		void Writer::assignIndexes() {
uint32_t GlobalIndex = ImportedGlobals.size();		uint32_t GlobalIndex = ImportedGlobals.size();
uint32_t FunctionIndex = ImportedFunctions.size();		uint32_t FunctionIndex = ImportedFunctions.size();

if (Config->StackPointerSymbol) {		if (Config->StackPointerSymbol) {
DefinedGlobals.emplace_back(Config->StackPointerSymbol);		DefinedGlobals.emplace_back(Config->StackPointerSymbol);
Config->StackPointerSymbol->setOutputIndex(GlobalIndex++);		Config->StackPointerSymbol->setOutputIndex(GlobalIndex++);
Show All 27 Lines	for (InputFunction *Func : File->Functions) {
continue;		continue;
DefinedFunctions.emplace_back(Func);		DefinedFunctions.emplace_back(Func);
Func->setOutputIndex(FunctionIndex++);		Func->setOutputIndex(FunctionIndex++);
}		}
}		}

for (ObjFile *File : Symtab->ObjectFiles) {		for (ObjFile *File : Symtab->ObjectFiles) {
DEBUG(dbgs() << "Table Indexes: " << File->getName() << "\n");		DEBUG(dbgs() << "Table Indexes: " << File->getName() << "\n");
for (Symbol *Sym : File->getTableSymbols()) {		auto HandleRelocs = [&](ArrayRef<WasmRelocation> Relocations) {
		for (const WasmRelocation& Reloc : Relocations) {
		if (Reloc.Type != R_WEBASSEMBLY_TABLE_INDEX_I32 &&
		Reloc.Type != R_WEBASSEMBLY_TABLE_INDEX_SLEB)
		continue;
		Symbol *Sym = File->getFunctionSymbols()[Reloc.Index];
if (Sym->hasTableIndex() \|\| !Sym->hasOutputIndex())		if (Sym->hasTableIndex() \|\| !Sym->hasOutputIndex())
continue;		continue;
Sym->setTableIndex(TableIndex++);		Sym->setTableIndex(TableIndex++);
IndirectFunctions.emplace_back(Sym);		IndirectFunctions.emplace_back(Sym);
}		}
		};
		for (InputFunction* Func : File->Functions) {
		if (Func->Discarded)
		continue;
		HandleRelocs(Func->Relocations);
		}
		for (InputSegment* Seg : File->Segments) {
		if (Seg->Discarded)
		continue;
		HandleRelocs(Seg->Relocations);
		}
}		}
}		}

static StringRef getOutputDataSegmentName(StringRef Name) {		static StringRef getOutputDataSegmentName(StringRef Name) {
if (Config->Relocatable)		if (Config->Relocatable)
return Name;		return Name;

for (StringRef V :		for (StringRef V :
Show All 22 Lines	for (InputSegment *Segment : File->Segments) {
}		}
S->addInputSegment(Segment);		S->addInputSegment(Segment);
DEBUG(dbgs() << "added data: " << Name << ": " << S->Size << "\n");		DEBUG(dbgs() << "added data: " << Name << ": " << S->Size << "\n");
}		}
}		}
}		}

void Writer::run() {		void Writer::run() {
if (!Config->Relocatable)
InitialTableOffset = 1;

log("-- calculateTypes");		log("-- calculateTypes");
calculateTypes();		calculateTypes();
log("-- calculateImports");		log("-- calculateImports");
calculateImports();		calculateImports();
log("-- assignIndexes");		log("-- assignIndexes");
assignIndexes();		assignIndexes();

if (errorHandler().Verbose) {		if (errorHandler().Verbose) {
▲ Show 20 Lines • Show All 58 Lines • Show Last 20 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[WebAssembly] Add symbol table to LLD, 1/2
AbandonedPublic

Details

Diff Detail

Event Timeline

Problem #1

Problem #2

Conclusion

Revision Contents

Diff 129479

wasm/InputChunks.h

wasm/InputChunks.cpp

wasm/InputFiles.h

wasm/InputFiles.cpp

wasm/Symbols.h

wasm/Writer.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[WebAssembly] Add symbol table to LLD, 1/2AbandonedPublic

Details

Diff Detail

Event Timeline

Problem #1

Problem #2

Conclusion

Revision Contents

Diff 129479

wasm/InputChunks.h

wasm/InputChunks.cpp

wasm/InputFiles.h

wasm/InputFiles.cpp

wasm/Symbols.h

wasm/Writer.cpp

[WebAssembly] Add symbol table to LLD, 1/2
AbandonedPublic