Index: ELF/LinkerScript.h =================================================================== --- ELF/LinkerScript.h +++ ELF/LinkerScript.h @@ -138,6 +138,7 @@ SortSectionPolicy SortInner; }; +class ThunkSection; struct InputSectionDescription : BaseCommand { InputSectionDescription(StringRef FilePattern) : BaseCommand(InputSectionKind), FilePat(FilePattern) {} @@ -153,6 +154,10 @@ std::vector SectionPatterns; std::vector Sections; + + // Temporary record of synthetic ThunkSection instances that we need to + // insert into Sections at the end of a createThunks() pass. + std::vector ThunkSections; }; // Represents an ASSERT(). Index: ELF/Relocations.h =================================================================== --- ELF/Relocations.h +++ ELF/Relocations.h @@ -121,6 +121,7 @@ class ThunkSection; class Thunk; +struct InputSectionDescription; class ThunkCreator { public: @@ -133,18 +134,17 @@ uint32_t Pass = 0; private: - void mergeThunks(); - ThunkSection *getOSThunkSec(OutputSection *OS, - std::vector *ISR); + void mergeThunks(ArrayRef OutputSections); + ThunkSection *getOSThunkSec(OutputSection *OS, InputSectionDescription *ISD); ThunkSection *getISThunkSec(InputSection *IS); - void forEachExecInputSection( + + void forEachInputSectionDescription( ArrayRef OutputSections, - std::function *, - InputSection *)> - Fn); + std::function Fn); + std::pair getThunk(SymbolBody &Body, uint32_t Type); - ThunkSection *addThunkSection(OutputSection *OS, - std::vector *, uint64_t Off); + ThunkSection *addThunkSection(OutputSection *OS, InputSectionDescription *, + uint64_t Off); // Record all the available Thunks for a Symbol llvm::DenseMap> ThunkedSymbols; @@ -157,16 +157,6 @@ // so we need to make sure that there is only one of them. // The Mips LA25 Thunk is an example of an inline ThunkSection. llvm::DenseMap ThunkedSections; - - // All the ThunkSections that we have created, organised by OutputSection - // will contain a mix of ThunkSections that have been created this pass, and - // ThunkSections that have been merged into the OutputSection on previous - // passes - std::map *, std::vector> - ThunkSections; - - // The ThunkSection for this vector of InputSections - ThunkSection *CurTS; }; // Return a int64_t to make sure we get the sign extension out of the way as Index: ELF/Relocations.cpp =================================================================== --- ELF/Relocations.cpp +++ ELF/Relocations.cpp @@ -987,40 +987,40 @@ scanRelocs(S, S.rels()); } -// Insert the Thunks for OutputSection OS into their designated place -// in the Sections vector, and recalculate the InputSection output section -// offsets. -// This may invalidate any output section offsets stored outside of InputSection -void ThunkCreator::mergeThunks() { - for (auto &KV : ThunkSections) { - std::vector *ISR = KV.first; - std::vector &Thunks = KV.second; - - // Order Thunks in ascending OutSecOff - auto ThunkCmp = [](const ThunkSection *A, const ThunkSection *B) { - return A->OutSecOff < B->OutSecOff; - }; - std::stable_sort(Thunks.begin(), Thunks.end(), ThunkCmp); - - // Merge sorted vectors of Thunks and InputSections by OutSecOff - std::vector Tmp; - Tmp.reserve(ISR->size() + Thunks.size()); - auto MergeCmp = [](const InputSection *A, const InputSection *B) { - // std::merge requires a strict weak ordering. - if (A->OutSecOff < B->OutSecOff) - return true; - if (A->OutSecOff == B->OutSecOff) - // Check if Thunk is immediately before any specific Target InputSection - // for example Mips LA25 Thunks. - if (auto *TA = dyn_cast(A)) - if (TA && TA->getTargetInputSection() == B) +// Merge the ThunkSections created this pass into the InputSectionDescriptions. +void ThunkCreator::mergeThunks(ArrayRef OutputSections) { + forEachInputSectionDescription( + OutputSections, [&](OutputSection *OS, InputSectionDescription *ISD) { + if (ISD->ThunkSections.empty()) + return; + + // Order Thunks in ascending OutSecOff + std::stable_sort(ISD->ThunkSections.begin(), ISD->ThunkSections.end(), + [](const ThunkSection *A, const ThunkSection *B) { + return A->OutSecOff < B->OutSecOff; + }); + + // Merge sorted vectors of Thunks and InputSections by OutSecOff + std::vector Tmp; + Tmp.reserve(ISD->Sections.size() + ISD->ThunkSections.size()); + auto MergeCmp = [](const InputSection *A, const InputSection *B) { + // std::merge requires a strict weak ordering. + if (A->OutSecOff < B->OutSecOff) return true; - return false; - }; - std::merge(ISR->begin(), ISR->end(), Thunks.begin(), Thunks.end(), - std::back_inserter(Tmp), MergeCmp); - *ISR = std::move(Tmp); - } + if (A->OutSecOff == B->OutSecOff) + // Check if Thunk is immediately before any specific Target + // InputSection for example Mips LA25 Thunks. + if (auto *TA = dyn_cast(A)) + if (TA && TA->getTargetInputSection() == B) + return true; + return false; + }; + std::merge(ISD->Sections.begin(), ISD->Sections.end(), + ISD->ThunkSections.begin(), ISD->ThunkSections.end(), + std::back_inserter(Tmp), MergeCmp); + ISD->Sections = std::move(Tmp); + ISD->ThunkSections.clear(); + }); } static uint32_t findEndOfFirstNonExec(OutputSection &Cmd) { @@ -1033,12 +1033,12 @@ } ThunkSection *ThunkCreator::getOSThunkSec(OutputSection *OS, - std::vector *ISR) { - if (CurTS == nullptr) { - uint32_t Off = findEndOfFirstNonExec(*OS); - CurTS = addThunkSection(OS, ISR, Off); - } - return CurTS; + InputSectionDescription *ISD) { + if (!ISD->ThunkSections.empty()) + return ISD->ThunkSections.front(); + + uint32_t Off = findEndOfFirstNonExec(*OS); + return addThunkSection(OS, ISD, Off); } // Add a Thunk that needs to be placed in a ThunkSection that immediately @@ -1051,27 +1051,25 @@ // Find InputSectionRange within Target Output Section (TOS) that the // InputSection (IS) that we need to precede is in. OutputSection *TOS = IS->getParent(); - std::vector *Range = nullptr; for (BaseCommand *BC : TOS->SectionCommands) if (auto *ISD = dyn_cast(BC)) { InputSection *first = ISD->Sections.front(); InputSection *last = ISD->Sections.back(); if (IS->OutSecOff >= first->OutSecOff && IS->OutSecOff <= last->OutSecOff) { - Range = &ISD->Sections; + TS = addThunkSection(TOS, ISD, IS->OutSecOff); + ThunkedSections[IS] = TS; break; } } - TS = addThunkSection(TOS, Range, IS->OutSecOff); - ThunkedSections[IS] = TS; return TS; } ThunkSection *ThunkCreator::addThunkSection(OutputSection *OS, - std::vector *ISR, + InputSectionDescription *ISD, uint64_t Off) { auto *TS = make(OS, Off); - ThunkSections[ISR].push_back(TS); + ISD->ThunkSections.push_back(TS); return TS; } @@ -1092,73 +1090,66 @@ // Call Fn on every executable InputSection accessed via the linker script // InputSectionDescription::Sections. -void ThunkCreator::forEachExecInputSection( +void ThunkCreator::forEachInputSectionDescription( ArrayRef OutputSections, - std::function *, - InputSection *)> - Fn) { + std::function Fn) { for (OutputSection *OS : OutputSections) { if (!(OS->Flags & SHF_ALLOC) || !(OS->Flags & SHF_EXECINSTR)) continue; for (BaseCommand *BC : OS->SectionCommands) - if (auto *ISD = dyn_cast(BC)) { - CurTS = nullptr; - for (InputSection *IS : ISD->Sections) - Fn(OS, &ISD->Sections, IS); - } + if (auto *ISD = dyn_cast(BC)) + Fn(OS, ISD); } } // Process all relocations from the InputSections that have been assigned -// to OutputSections and redirect through Thunks if needed. +// to InputSectionDescriptions and redirect through Thunks if needed. // // createThunks must be called after scanRelocs has created the Relocations for // each InputSection. It must be called before the static symbol table is -// finalized. If any Thunks are added to an OutputSection the output section -// offsets of the InputSections will change. +// finalized. If any Thunks are added to an InputSectionDescription the +// offsets within the OutputSection of the InputSections will change. // // FIXME: All Thunks are assumed to be in range of the relocation. Range // extension Thunks are not yet supported. bool ThunkCreator::createThunks(ArrayRef OutputSections) { - if (Pass > 0) - ThunkSections.clear(); - + bool AddressesChanged = false; // Create all the Thunks and insert them into synthetic ThunkSections. The - // ThunkSections are later inserted back into the OutputSection. - + // ThunkSections are later inserted back into InputSectionDescriptions. // We separate the creation of ThunkSections from the insertion of the - // ThunkSections back into the OutputSection as ThunkSections are not always - // inserted into the same OutputSection as the caller. - forEachExecInputSection(OutputSections, [&](OutputSection *OS, - std::vector *ISR, - InputSection *IS) { - for (Relocation &Rel : IS->Relocations) { - SymbolBody &Body = *Rel.Sym; - if (Thunks.find(&Body) != Thunks.end() || - !Target->needsThunk(Rel.Expr, Rel.Type, IS->File, Body)) - continue; - Thunk *T; - bool IsNew; - std::tie(T, IsNew) = getThunk(Body, Rel.Type); - if (IsNew) { - // Find or create a ThunkSection for the new Thunk - ThunkSection *TS; - if (auto *TIS = T->getTargetInputSection()) - TS = getISThunkSec(TIS); - else - TS = getOSThunkSec(OS, ISR); - TS->addThunk(T); - Thunks[T->ThunkSym] = T; - } - // Redirect relocation to Thunk, we never go via the PLT to a Thunk - Rel.Sym = T->ThunkSym; - Rel.Expr = fromPlt(Rel.Expr); - } - }); + // ThunkSections as ThunkSections are not always inserted into the same + // InputSectionDescription as the caller. + forEachInputSectionDescription( + OutputSections, [&](OutputSection *OS, InputSectionDescription *ISD) { + for (InputSection *IS : ISD->Sections) + for (Relocation &Rel : IS->Relocations) { + SymbolBody &Body = *Rel.Sym; + if (Thunks.find(&Body) != Thunks.end() || + !Target->needsThunk(Rel.Expr, Rel.Type, IS->File, Body)) + continue; + Thunk *T; + bool IsNew; + std::tie(T, IsNew) = getThunk(Body, Rel.Type); + if (IsNew) { + AddressesChanged = true; + // Find or create a ThunkSection for the new Thunk + ThunkSection *TS; + if (auto *TIS = T->getTargetInputSection()) + TS = getISThunkSec(TIS); + else + TS = getOSThunkSec(OS, ISD); + TS->addThunk(T); + Thunks[T->ThunkSym] = T; + } + // Redirect relocation to Thunk, we never go via the PLT to a Thunk + Rel.Sym = T->ThunkSym; + Rel.Expr = fromPlt(Rel.Expr); + } + }); // Merge all created synthetic ThunkSections back into OutputSection - mergeThunks(); + mergeThunks(OutputSections); ++Pass; - return !ThunkSections.empty(); + return AddressesChanged; } template void elf::scanRelocations(InputSectionBase &);