Index: ELF/LinkerScript.h =================================================================== --- ELF/LinkerScript.h +++ ELF/LinkerScript.h @@ -86,6 +86,7 @@ std::vector<StringRef> Phdrs; std::vector<uint8_t> Filler; ConstraintKind Constraint = ConstraintKind::NoConstraint; + bool HasSymbols = false; }; enum SortKind { SortNone, SortByName, SortByAlignment }; @@ -146,16 +147,12 @@ bool shouldKeep(InputSectionBase<ELFT> *S); void assignAddresses(); int compareSections(StringRef A, StringRef B); - void addScriptedSymbols(); bool hasPhdrsCommands(); uintX_t getOutputSectionSize(StringRef Name); std::vector<OutputSectionBase<ELFT> *> *OutputSections; private: - std::vector<std::pair<StringRef, const InputSectionDescription *>> - getSectionMap(); - std::vector<InputSectionBase<ELFT> *> getInputSections(const InputSectionDescription *); Index: ELF/LinkerScript.cpp =================================================================== --- ELF/LinkerScript.cpp +++ ELF/LinkerScript.cpp @@ -43,6 +43,36 @@ ScriptConfiguration *elf::ScriptConfig; +template <class ELFT> +static Symbol *addSymbolToSymtabAux(StringRef Name, uint8_t StOther) { + return Symtab<ELFT>::X->addRegular(Name, STB_GLOBAL, StOther); +} + +template <class ELFT> +static Symbol *addSymbolToSymtabAux(StringRef Name, typename ELFT::uint Value, + OutputSectionBase<ELFT> *Section) { + return Symtab<ELFT>::X->addSynthetic(Name, Section, Value); +} + +template <class ELFT, class... ArgsT> +static bool addSymbolToSymtab(SymbolAssignment &Cmd, ArgsT... Args) { + if (Cmd.Name == ".") + return false; + + // If a symbol was in PROVIDE(), define it only when it is an + // undefined symbol. + SymbolBody *B = Symtab<ELFT>::X->find(Cmd.Name); + if (Cmd.Provide && !(B && B->isUndefined())) + return false; + + Symbol *Sym = + addSymbolToSymtabAux<ELFT>(Cmd.Name, std::forward<ArgsT>(Args)...); + + Sym->Visibility = Cmd.Hidden ? STV_HIDDEN : STV_DEFAULT; + Cmd.Sym = Sym->body(); + return true; +} + bool SymbolAssignment::classof(const BaseCommand *C) { return C->Kind == AssignmentKind; } @@ -78,21 +108,6 @@ return false; } -// Create a vector of (<output section name>, <input section description>). -template <class ELFT> -std::vector<std::pair<StringRef, const InputSectionDescription *>> -LinkerScript<ELFT>::getSectionMap() { - std::vector<std::pair<StringRef, const InputSectionDescription *>> Ret; - - for (const std::unique_ptr<BaseCommand> &Base1 : Opt.Commands) - if (auto *Cmd1 = dyn_cast<OutputSectionCommand>(Base1.get())) - for (const std::unique_ptr<BaseCommand> &Base2 : Cmd1->Commands) - if (auto *Cmd2 = dyn_cast<InputSectionDescription>(Base2.get())) - Ret.emplace_back(Cmd1->Name, Cmd2); - - return Ret; -} - static bool fileMatches(const InputSectionDescription *Desc, StringRef Filename) { if (!globMatch(Desc->FilePattern, Filename)) @@ -121,18 +136,86 @@ return Ret; } -// Add input section to output section. If there is no output section yet, -// then create it and add to output section list. +namespace { +template <class ELFT> class LayoutInputSection : public InputSection<ELFT> { +public: + LayoutInputSection(SymbolAssignment *Cmd); + SymbolAssignment *Cmd; + +private: + typename ELFT::Shdr Hdr; +}; + +// Helper class, which builds output section list, also +// creating symbol sections, when needed +template <class ELFT> class OutputSectionBuilder { +public: + OutputSectionBuilder(OutputSectionFactory<ELFT> &F, + std::vector<OutputSectionBase<ELFT> *> *Out) + : Factory(F), OutputSections(Out) {} + + void addSection(StringRef OutputName, InputSectionBase<ELFT> *I); + void addSymbol(SymbolAssignment *Cmd) { + PendingSymbols.emplace_back(new LayoutInputSection<ELFT>(Cmd)); + } + void flushSymbols(); + void finalize(); + +private: + OutputSectionFactory<ELFT> &Factory; + std::vector<OutputSectionBase<ELFT> *> *OutputSections; + OutputSectionBase<ELFT> *Current = nullptr; + std::vector<std::unique_ptr<LayoutInputSection<ELFT>>> PendingSymbols; + static std::vector<std::unique_ptr<LayoutInputSection<ELFT>>> OwningSections; +}; + template <class ELFT> -static void addSection(OutputSectionFactory<ELFT> &Factory, - std::vector<OutputSectionBase<ELFT> *> &Out, - InputSectionBase<ELFT> *C, StringRef Name) { - OutputSectionBase<ELFT> *Sec; +std::vector<std::unique_ptr<LayoutInputSection<ELFT>>> + OutputSectionBuilder<ELFT>::OwningSections; +} + +template <class T> static T *zero(T *Val) { + memset(Val, 0, sizeof(*Val)); + return Val; +} + +template <class ELFT> +LayoutInputSection<ELFT>::LayoutInputSection(SymbolAssignment *Cmd) + : InputSection<ELFT>(nullptr, zero(&Hdr)), Cmd(Cmd) { + this->Live = true; + this->Repl = nullptr; + Hdr.sh_type = SHT_NOBITS; +} + +template <class ELFT> +void OutputSectionBuilder<ELFT>::addSection(StringRef OutputName, + InputSectionBase<ELFT> *C) { bool IsNew; - std::tie(Sec, IsNew) = Factory.create(C, Name); + std::tie(Current, IsNew) = Factory.create(C, OutputName); if (IsNew) - Out.push_back(Sec); - Sec->addSection(C); + OutputSections->push_back(Current); + flushSymbols(); + Current->addSection(C); +} + +template <class ELFT> void OutputSectionBuilder<ELFT>::flushSymbols() { + for (std::unique_ptr<LayoutInputSection<ELFT>> &I : PendingSymbols) + if (I->Cmd->Name == "." || addSymbolToSymtab<ELFT>(*I->Cmd, 0, Current)) { + Current->addSection(I.get()); + OwningSections.push_back(std::move(I)); + } + + PendingSymbols.clear(); +} + +template <class ELFT> void OutputSectionBuilder<ELFT>::finalize() { + // Assign offsets to all sections which don't contain symbols + for (OutputSectionBase<ELFT> *S : *OutputSections) + if (llvm::find_if(OwningSections, + [&](std::unique_ptr<LayoutInputSection<ELFT>> &L) { + return L->OutSec == S; + }) == OwningSections.end()) + S->assignOffsets(); } template <class ELFT> @@ -160,40 +243,51 @@ template <class ELFT> void LinkerScript<ELFT>::createSections( OutputSectionFactory<ELFT> &Factory) { - for (auto &P : getSectionMap()) { - StringRef OutputName = P.first; - const InputSectionDescription *Cmd = P.second; - std::vector<InputSectionBase<ELFT> *> Sections = getInputSections(Cmd); + OutputSectionBuilder<ELFT> Builder(Factory, OutputSections); + auto Add = [&](StringRef OutputName, const InputSectionDescription *Cmd) { + std::vector<InputSectionBase<ELFT> *> Sections = getInputSections(Cmd); if (OutputName == "/DISCARD/") { for (InputSectionBase<ELFT> *S : Sections) { S->Live = false; reportDiscarded(S); } - continue; + return; } - if (Cmd->SortInner) std::stable_sort(Sections.begin(), Sections.end(), getComparator<ELFT>(Cmd->SortInner)); if (Cmd->SortOuter) std::stable_sort(Sections.begin(), Sections.end(), getComparator<ELFT>(Cmd->SortOuter)); - for (InputSectionBase<ELFT> *S : Sections) - addSection(Factory, *OutputSections, S, OutputName); - } + Builder.addSection(OutputName, S); + }; + + for (const std::unique_ptr<BaseCommand> &Base1 : Opt.Commands) + if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base1.get())) { + for (const std::unique_ptr<BaseCommand> &Base2 : Cmd->Commands) + if (auto *Assignment = dyn_cast<SymbolAssignment>(Base2.get())) + Builder.addSymbol(Assignment); + else + Add(Cmd->Name, cast<InputSectionDescription>(Base2.get())); + + Builder.flushSymbols(); + } else if (auto *Cmd2 = dyn_cast<SymbolAssignment>(Base1.get())) { + addSymbolToSymtab<ELFT>(*Cmd2, STV_DEFAULT); + } // Add all other input sections, which are not listed in script. for (const std::unique_ptr<ObjectFile<ELFT>> &F : Symtab<ELFT>::X->getObjectFiles()) for (InputSectionBase<ELFT> *S : F->getSections()) if (!isDiscarded(S) && !S->OutSec) - addSection(Factory, *OutputSections, S, getOutputSectionName(S)); + Builder.addSection(getOutputSectionName(S), S); // Remove from the output all the sections which did not meet // the optional constraints. filter(); + Builder.finalize(); } template <class R, class T> @@ -224,6 +318,33 @@ } } +template <class ELFT> void assignOffsets(OutputSectionBase<ELFT> *Sec) { + if (Sec->getSize()) + return; + + typedef typename ELFT::uint uintX_t; + uintX_t Off = 0; + OutputSection<ELFT> *OutSec = static_cast<OutputSection<ELFT> *>(Sec); + + for (InputSection<ELFT> *I : OutSec->Sections) { + if (!I->Repl) { + LayoutInputSection<ELFT> *L = static_cast<LayoutInputSection<ELFT> *>(I); + uintX_t Value = L->Cmd->Expression(Sec->getVA() + Off) - Sec->getVA(); + if (L->Cmd->Name == ".") + Off = Value; + else + cast<DefinedSynthetic<ELFT>>(L->Cmd->Sym)->Value = Value; + } else { + Off = alignTo(Off, I->Alignment); + I->OutSecOff = Off; + Off += I->getSize(); + } + // Update section size, so that SIZEOF works correctly in the case below: + // .foo { ... a = SIZEOF(.foo) ... } + Sec->setSize(Off); + } +} + template <class ELFT> void LinkerScript<ELFT>::assignAddresses() { ArrayRef<OutputSectionBase<ELFT> *> Sections = *OutputSections; // Orphan sections are sections present in the input files which @@ -275,6 +396,8 @@ uintX_t TVA = Dot + ThreadBssOffset; TVA = alignTo(TVA, Sec->getAlignment()); Sec->setVA(TVA); + if (Cmd->HasSymbols) + assignOffsets(Sec); ThreadBssOffset = TVA - Dot + Sec->getSize(); continue; } @@ -282,6 +405,8 @@ if (Sec->getFlags() & SHF_ALLOC) { Dot = alignTo(Dot, Sec->getAlignment()); Sec->setVA(Dot); + if (Cmd->HasSymbols) + assignOffsets(Sec); MinVA = std::min(MinVA, Dot); Dot += Sec->getSize(); continue; @@ -395,28 +520,6 @@ return I < J ? -1 : 1; } -// Add symbols defined by linker scripts. -template <class ELFT> void LinkerScript<ELFT>::addScriptedSymbols() { - for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) { - auto *Cmd = dyn_cast<SymbolAssignment>(Base.get()); - if (!Cmd || Cmd->Name == ".") - continue; - - // If a symbol was in PROVIDE(), define it only when it is an - // undefined symbol. - SymbolBody *B = Symtab<ELFT>::X->find(Cmd->Name); - if (Cmd->Provide && !(B && B->isUndefined())) - continue; - - // Define an absolute symbol. The symbol value will be assigned later. - // (At this point, we don't know the final address yet.) - Symbol *Sym = Symtab<ELFT>::X->addUndefined(Cmd->Name); - replaceBody<DefinedRegular<ELFT>>(Sym, Cmd->Name, STV_DEFAULT); - Sym->Visibility = Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT; - Cmd->Sym = Sym->body(); - } -} - template <class ELFT> bool LinkerScript<ELFT>::hasPhdrsCommands() { return !Opt.PhdrsCommands.empty(); } @@ -494,6 +597,7 @@ unsigned readPhdrType(); SortKind readSortKind(); SymbolAssignment *readProvide(bool Hidden); + SymbolAssignment *readProvideOrAssignment(StringRef Tok); Expr readAlign(); void readSort(); Expr readAssert(); @@ -683,18 +787,12 @@ expect("{"); while (!Error && !skip("}")) { StringRef Tok = next(); - BaseCommand *Cmd; - if (peek() == "=" || peek() == "+=") { - Cmd = readAssignment(Tok); - expect(";"); - } else if (Tok == "PROVIDE") { - Cmd = readProvide(false); - } else if (Tok == "PROVIDE_HIDDEN") { - Cmd = readProvide(true); - } else if (Tok == "ASSERT") { - Cmd = new AssertCommand(readAssert()); - } else { - Cmd = readOutputSectionDescription(Tok); + BaseCommand *Cmd = readProvideOrAssignment(Tok); + if (!Cmd) { + if (Tok == "ASSERT") + Cmd = new AssertCommand(readAssert()); + else + Cmd = readOutputSectionDescription(Tok); } Opt.Commands.emplace_back(Cmd); } @@ -831,11 +929,15 @@ Cmd->Commands.emplace_back(readInputSectionDescription()); continue; } - if (skip("SORT")) { + + StringRef Tok = next(); + if (SymbolAssignment *Assignment = readProvideOrAssignment(Tok)) { + Cmd->Commands.emplace_back(Assignment); + Cmd->HasSymbols = true; + } else if (Tok == "SORT") readSort(); - continue; - } - setError("unknown command " + peek()); + else + setError("unknown command " + Tok); } Cmd->Phdrs = readOutputSectionPhdrs(); Cmd->Filler = readOutputSectionFiller(); @@ -872,6 +974,19 @@ return Cmd; } +SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok) { + SymbolAssignment *Cmd = nullptr; + if (peek() == "=" || peek() == "+=") { + Cmd = readAssignment(Tok); + expect(";"); + } else if (Tok == "PROVIDE") { + Cmd = readProvide(false); + } else if (Tok == "PROVIDE_HIDDEN") { + Cmd = readProvide(true); + } + return Cmd; +} + static uint64_t getSymbolValue(StringRef S, uint64_t Dot) { if (S == ".") return Dot; Index: ELF/Symbols.cpp =================================================================== --- ELF/Symbols.cpp +++ ELF/Symbols.cpp @@ -58,7 +58,7 @@ Offset += Addend; Addend = 0; } - uintX_t VA = SC->OutSec->getVA() + SC->getOffset(Offset); + uintX_t VA = (SC->OutSec ? SC->OutSec->getVA() : 0) + SC->getOffset(Offset); if (D.isTls()) return VA - Out<ELFT>::TlsPhdr->p_vaddr; return VA; Index: ELF/Writer.cpp =================================================================== --- ELF/Writer.cpp +++ ELF/Writer.cpp @@ -230,6 +230,9 @@ copyLocalSymbols(); addReservedSymbols(); + if (Target->NeedsThunks) + forEachRelSec(createThunks<ELFT>); + CommonInputSection<ELFT> Common(getCommonSymbols<ELFT>()); CommonInputSection<ELFT>::X = &Common; @@ -657,6 +660,16 @@ Sec->addSection(C); } } + + sortInitFini( + Factory.lookup(".init_array", SHT_INIT_ARRAY, SHF_WRITE | SHF_ALLOC)); + sortInitFini( + Factory.lookup(".fini_array", SHT_FINI_ARRAY, SHF_WRITE | SHF_ALLOC)); + sortCtorsDtors(Factory.lookup(".ctors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); + sortCtorsDtors(Factory.lookup(".dtors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); + + for (OutputSectionBase<ELFT> *Sec : OutputSections) + Sec->assignOffsets(); } // Create output section objects and add them to OutputSections. @@ -676,12 +689,6 @@ Out<ELFT>::Dynamic->FiniArraySec = Factory.lookup(".fini_array", SHT_FINI_ARRAY, SHF_WRITE | SHF_ALLOC); - // Sort section contents for __attribute__((init_priority(N)). - sortInitFini(Out<ELFT>::Dynamic->InitArraySec); - sortInitFini(Out<ELFT>::Dynamic->FiniArraySec); - sortCtorsDtors(Factory.lookup(".ctors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); - sortCtorsDtors(Factory.lookup(".dtors", SHT_PROGBITS, SHF_WRITE | SHF_ALLOC)); - // The linker needs to define SECNAME_start, SECNAME_end and SECNAME_stop // symbols for sections, so that the runtime can get the start and end // addresses of each section by section name. Add such symbols. @@ -701,21 +708,11 @@ // Define __rel[a]_iplt_{start,end} symbols if needed. addRelIpltSymbols(); - // Add scripted symbols with zero values now. - // Real values will be assigned later - Script<ELFT>::X->addScriptedSymbols(); - if (!Out<ELFT>::EhFrame->empty()) { OutputSections.push_back(Out<ELFT>::EhFrame); Out<ELFT>::EhFrame->finalize(); } - if (Target->NeedsThunks) - forEachRelSec(createThunks<ELFT>); - - for (OutputSectionBase<ELFT> *Sec : OutputSections) - Sec->assignOffsets(); - // Scan relocations. This must be done after every symbol is declared so that // we can correctly decide if a dynamic relocation is needed. forEachRelSec(scanRelocations<ELFT>); Index: test/ELF/linkerscript/linkerscript-symbols-synthetic.s =================================================================== --- test/ELF/linkerscript/linkerscript-symbols-synthetic.s +++ test/ELF/linkerscript/linkerscript-symbols-synthetic.s @@ -0,0 +1,38 @@ +# REQUIRES: x86 +# RUN: llvm-mc -filetype=obj -triple=x86_64-unknown-linux %s -o %t + +# Simple symbol assignment within input section list. The '.' symbol +# is not location counter but offset from the beginning of output +# section .foo +# RUN: echo "SECTIONS { \ +# RUN: .foo : { \ +# RUN: begin_foo = .; \ +# RUN: *(.foo) \ +# RUN: end_foo = .; \ +# RUN: size_foo_1 = SIZEOF(.foo); \ +# RUN: . = ALIGN(0x1000); \ +# RUN: begin_bar = .; \ +# RUN: *(.bar) \ +# RUN: end_bar = .; \ +# RUN: size_foo_2 = SIZEOF(.foo); \ +# RUN: } \ +# RUN: size_foo_3 = SIZEOF(.foo); }" > %t.script +# RUN: ld.lld -o %t1 --script %t.script %t +# RUN: llvm-objdump -t %t1 | FileCheck --check-prefix=SIMPLE %s +# SIMPLE: 0000000000000120 .foo 00000000 begin_foo +# SIMPLE-NEXT: 0000000000000128 .foo 00000000 end_foo +# SIMPLE-NEXT: 0000000000000008 .foo 00000000 size_foo_1 +# SIMPLE-NEXT: 0000000000001000 .foo 00000000 begin_bar +# SIMPLE-NEXT: 0000000000001004 .foo 00000000 end_bar +# SIMPLE-NEXT: 0000000000000ee4 .foo 00000000 size_foo_2 +# SIMPLE-NEXT: 0000000000000ee4 *ABS* 00000000 size_foo_3 + +.global _start +_start: + nop + +.section .foo,"a" + .quad 0 + +.section .bar,"a" + .long 0