This is an archive of the discontinued LLVM Phabricator instance.

[DWARFLinkerParallel] Add limited functionality to DWARFLinkerParallel.
ClosedPublic

Authored by avl on Jun 19 2023, 5:21 AM.

Details

Summary

This patch is extracted from D96035. It adds support for the existing
DWARFLinker functionality. What is not supported yet:

  1. Type deduplication (--odr mode).
  2. Module deduplication.
  3. Generation of index tables.

Run-time performance and memory requirements for the clang binary with --num-threads 16:

----------------------------------------------------------------------------------
                                                      |  time, sec   |  mem, GB  |
----------------------------------------------------------------------------------
dsymutil --no-odr --accelerator None --linker llvm    |      44      |   18.0    |
----------------------------------------------------------------------------------
dsymutil --no-odr --accelerator None --linker apple   |     248      |   22.2    |
----------------------------------------------------------------------------------

Run-time performance and memory requirements for the clang binary with --num-threads 1:

----------------------------------------------------------------------------------
                                                      |  time, sec   |  mem, GB  |
----------------------------------------------------------------------------------
dsymutil --no-odr --accelerator None --linker llvm    |     242      |   17.2    |
----------------------------------------------------------------------------------
dsymutil --no-odr --accelerator None --linker apple   |     260      |   19.4    |
----------------------------------------------------------------------------------

The overall linking process looks like this:

parallel_for_each(ObjectFile) {
  for_each (Compile Unit) {
    1. Load Clang modules.
  }

  parallel_for_each(Compile Unit) {
    1. Load input DWARF for Compile Unit.
    2. Report warnings for Clang modules.
    3. Analyze live DIEs.
    4. Clone DIEs (generate output DIEs and the resulting DWARF tables).
        The result is a set of sections corresponding to the current compile unit.
    5. Clean up input and output DIEs.
  }

  Deallocate loaded Object file.
}

for_each (ObjectFile) {
  for_each (Compile Unit) {
    1. Set offsets for the Compile Unit's DWARF sections.
    2. Sort offsets/attributes/patches to have a predictable result.
    3. Patch size/offset fields.
    4. Generate index tables.
    5. Move DWARF sections of compile units into the resulting file.
  }
}
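
A minimal C++ sketch of the first (parallel) loop above, using LLVM's parallel
utilities. ObjectFileRef, CompileUnitRef, loadClangModules and linkCompileUnit
are hypothetical stand-ins for the real linker entities, not the classes used
by this patch:

#include "llvm/Support/Parallel.h"
#include <vector>

struct CompileUnitRef { /* per-CU state lives here */ };
struct ObjectFileRef { std::vector<CompileUnitRef> CUs; };

static void loadClangModules(CompileUnitRef &) { /* stage 1, sequential */ }
static void linkCompileUnit(CompileUnitRef &) {
  // Load input DWARF, analyze live DIEs, clone DIEs into per-CU output
  // sections, then release the input/output DIE data.
}

void linkObjectFiles(std::vector<ObjectFileRef> &Files) {
  llvm::parallelForEach(Files, [](ObjectFileRef &File) {
    for (CompileUnitRef &CU : File.CUs)        // sequential pre-pass
      loadClangModules(CU);
    // Note: a nested parallelForEach may fall back to sequential execution
    // depending on the parallel strategy; the real linker manages its own
    // task scheduling.
    llvm::parallelForEach(File.CUs, [](CompileUnitRef &CU) {
      linkCompileUnit(CU);                     // per-CU pass
    });
    // The loaded object file can be deallocated here.
  });
}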

Every compile unit is processed separately and visited only once
(except when inter-CU references exist), and its data is freed
after the compile unit is processed. The resulting file is glued together
from the generated debug tables that correspond to the separate compile units.

Handling inter-CU references: inter-CU references are hard to process
in a single pass. For example, if CU1 references CU100 and CU100 references
CU1, we cannot finish handling CU1 until we have finished CU100.
Thus we either need to load all CUs into memory or load CUs several
times. This implementation loads inter-connected CUs into memory during the
first pass and processes them during the second pass.

Changes from the current implementation (these make DWARFLinkerParallel binary incompatible with the current DWARFLinker):

a) No common abbreviation table. Each compile unit has its own abbreviation
table. Generating a common abbreviation table slows down parallel execution
(it is a resource that is accessed many times from many threads). An
abbreviation table does not take much space, so it looks cheap to have
separate abbreviation tables. Later, this might be optimized a bit (by
removing equal abbreviation tables).

b) .debug_frame: already generated CIE records are not reused between object files.

c) Location expressions containing type references use a fixed-length ULEB128 encoding, as they need to be patched after the referenced body is generated (see the sketch after this list).

d) The liveness-tracking algorithm does not depend on the order of DW_TAG_imported_module nodes and in some cases keeps more DIEs.
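
To illustrate item (c): a minimal sketch of padded ULEB128 encoding using
LLVM's LEB128 helpers. The 4-byte width and the helper names below are
assumptions for illustration, not necessarily what the patch uses:

#include "llvm/Support/LEB128.h"
#include <cstdint>

static constexpr unsigned PatchableULEBSize = 4; // assumed fixed width

// Emit a zero placeholder padded to a fixed number of bytes; returns the
// number of bytes written (always PatchableULEBSize here).
inline unsigned emitPlaceholder(uint8_t *Buf) {
  return llvm::encodeULEB128(/*Value=*/0, Buf, /*PadTo=*/PatchableULEBSize);
}

// Later, overwrite the same bytes in place; as long as the final value fits
// into PatchableULEBSize bytes, no surrounding data has to be shifted.
inline void patchReference(uint8_t *Buf, uint64_t FinalValue) {
  llvm::encodeULEB128(FinalValue, Buf, /*PadTo=*/PatchableULEBSize);
}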

Diff Detail

Event Timeline

avl created this revision.Jun 19 2023, 5:21 AM
Herald added a project: Restricted Project.Jun 19 2023, 5:21 AM
avl requested review of this revision.Jun 19 2023, 5:21 AM
avl edited the summary of this revision. (Show Details)Jun 19 2023, 5:23 AM
avl edited the summary of this revision. (Show Details)Jun 19 2023, 5:59 AM
avl edited the summary of this revision. (Show Details)
avl edited the summary of this revision. (Show Details)Jun 19 2023, 6:09 AM

a) No common abbreviation table. Each compile unit has its own abbreviation table. Generating a common abbreviation table slows down parallel execution (it is a resource that is accessed many times from many threads). An abbreviation table does not take much space, so it looks cheap to have separate abbreviation tables. Later, this might be optimized a bit (by removing equal abbreviation tables).

Can't we just let each compile unit generate its own abbrev table and then unique them into a single abbrev table when we write out the .debug_info data? That way compile units can stay fast in parallel execution, and since we need to emit the compile units serially when generating the .debug_info, we can just have a map that maps CU-specific abbrev codes to the global and final abbrev list? Then we end up with just one .debug_abbrev table in the end.

avl added a comment.Jun 20 2023, 2:44 PM

a) No common abbreviation table. Each compile unit has its own abbreviation table. Generating a common abbreviation table slows down parallel execution (it is a resource that is accessed many times from many threads). An abbreviation table does not take much space, so it looks cheap to have separate abbreviation tables. Later, this might be optimized a bit (by removing equal abbreviation tables).

Can't we just let each compile unit generate its own abbrev table and then unique them into a single abbrev table when we write out the .debug_info data? That way compile units can stay fast in parallel execution, and since we need to emit the compile units serially when generating the .debug_info, we can just have a map that maps CU-specific abbrev codes to the global and final abbrev list? Then we end up with just one .debug_abbrev table in the end.

The problem with this solution seems to be that when a local abbreviation number is replaced with a global number (which is in ULEB128 format), the DIE offsets will change (because the size of the global number may differ from the size of the local number). That would break all sizes and references.
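
For example (a small illustration using LLVM's LEB128 helpers; the concrete
code values are arbitrary):

#include "llvm/Support/LEB128.h"
#include <cassert>

void abbrevCodeSizeChanges() {
  assert(llvm::getULEB128Size(27) == 1);    // small per-CU code: 1 byte
  assert(llvm::getULEB128Size(300) == 2);   // larger global code: 2 bytes
  assert(llvm::getULEB128Size(20000) == 3); // grows again past 16383
  // Every DIE whose abbreviation code grows by a byte shifts all following
  // DIE offsets, invalidating already-computed sizes and references.
}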

Also, currently a CU is emitted immediately (when we write out the .debug_info data). The global abbreviation table could only be finished at the very end, after all CUs are emitted. That means we would need to parse the already-emitted CUs and update the abbreviation numbers. It would probably slow down execution.

The size of the abbreviation table for a clang binary with a 1.7 GB .debug_info is 12.5 KB for DWARFLinker and 7.2 MB for DWARFLinkerParallel, i.e. the new abbreviation table is approximately 0.5% of the overall .debug_info size. It looks relatively cheap. Still, any solution making .debug_abbrev shorter would certainly be good. We might experiment with fixed-length abbreviation numbers...

avl added a comment.Jun 20 2023, 2:56 PM

Another solution might be to reuse the abbreviation table from an already-generated CU for the next CU. At any given moment the current CU would own the abbreviation table, but in the end a single abbreviation table would be shared between several CUs. That way, several tables would still exist, but some of them would be shared. It would reduce the current size of .debug_abbrev.

a) No common abbreviation table. Each compile unit has its own abbreviation table. Generating a common abbreviation table slows down parallel execution (it is a resource that is accessed many times from many threads). An abbreviation table does not take much space, so it looks cheap to have separate abbreviation tables. Later, this might be optimized a bit (by removing equal abbreviation tables).

Can't we just let each compile unit generate its own abbrev table and then unique them into a single abbrev table when we write out the .debug_info data? That way compile units can stay fast in parallel execution, and since we need to emit the compile units serially when generating the .debug_info, we can just have a map that maps CU-specific abbrev codes to the global and final abbrev list? Then we end up with just one .debug_abbrev table in the end.

The problem with this solution seems to be that when a local abbreviation number is replaced with a global number (which is in ULEB128 format), the DIE offsets will change (because the size of the global number may differ from the size of the local number). That would break all sizes and references.

We make up DIEs to emit, but _as_ we emit the DIEs from a CU, can't we globalize the abbrev from the local CU as they are being emitted? Each abbrev could cache its global value if it has already been emitted from each CU. I am thinking that DIEs would have references to other DIEs using pointers when they are stored in intermediate form, but this might not be true, come to think of it. If references would need to be updated then this wouldn't work, as you mentioned.

Also, currently a CU is emitted immediately (when we write out the .debug_info data). The global abbreviation table could only be finished at the very end, after all CUs are emitted. That means we would need to parse the already-emitted CUs and update the abbreviation numbers. It would probably slow down execution.

Yeah, if DIE refs are done with hard-coded offsets up front then this wouldn't work. A DWARF generator I created in Python has references pointing to a DIE object so that it can ask that object for its offset when a reference is needed, and if it isn't available yet, it gets added to a fixup list for forward refs, and then they get fixed up in a post-CU output phase. This is nice because I never have to worry about reference offsets as they "just work". I admit I am not as familiar with how the LLVM DWARFLinker does things.

The size of the abbreviation table for a clang binary with a 1.7 GB .debug_info is 12.5 KB for DWARFLinker and 7.2 MB for DWARFLinkerParallel, i.e. the new abbreviation table is approximately 0.5% of the overall .debug_info size. It looks relatively cheap. Still, any solution making .debug_abbrev shorter would certainly be good. We might experiment with fixed-length abbreviation numbers...

No real worry if the size isn't too big.

Another solution might be to reuse the abbreviation table from an already-generated CU for the next CU. At any given moment the current CU would own the abbreviation table, but in the end a single abbreviation table would be shared between several CUs. That way, several tables would still exist, but some of them would be shared. It would reduce the current size of .debug_abbrev.

I like this idea. Not needed for this patch, but sounds like a good idea.

avl added a comment.Jun 21 2023, 7:08 AM

a) No common abbreviation table. Each compile unit has its own abbreviation table. Generating a common abbreviation table slows down parallel execution (it is a resource that is accessed many times from many threads). An abbreviation table does not take much space, so it looks cheap to have separate abbreviation tables. Later, this might be optimized a bit (by removing equal abbreviation tables).

Can't we just let each compile unit generate its own abbrev table and then unique them into a single abbrev table when we write out the .debug_info data? That way compile units can stay fast in parallel execution, and since we need to emit the compile units serially when generating the .debug_info, we can just have a map that maps CU-specific abbrev codes to the global and final abbrev list? Then we end up with just one .debug_abbrev table in the end.

The problem with this solution seems to be that when a local abbreviation number is replaced with a global number (which is in ULEB128 format), the DIE offsets will change (because the size of the global number may differ from the size of the local number). That would break all sizes and references.

We make up DIEs to emit, but _as_ we emit the DIEs from a CU, can't we globalize the abbrev from the local CU as they are being emitted?

We can, but after the abbrev numbers are globalized we would need to update all size and reference fields and rewrite the emitted DWARF.

Each abbrev could cache its global value if it has already been emitted from each CU. I am thinking that DIEs would have references to other DIEs using pointers when they are stored in intermediate form, but this might not be true, come to think of it. If references would need to be updated then this wouldn't work, as you mentioned.

This patch uses the CodeGen DIE class. It does not use pointers for references/sizes/offsets; these are absolute values:

DIE::setOffset()  // absolute offset of the DIE in the output debug info
DIE::setSize()    // absolute size of the DIE
DIE::addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), dwarf::DW_FORM_ref_addr,
              DIEInteger(0x0))  // zero placeholder reference, patched later

Also, currently a CU is emitted immediately (when we write out the .debug_info data). The global abbreviation table could only be finished at the very end, after all CUs are emitted. That means we would need to parse the already-emitted CUs and update the abbreviation numbers. It would probably slow down execution.

Yeah, if DIE refs are done with hard-coded offsets up front then this wouldn't work. A DWARF generator I created in Python has references pointing to a DIE object so that it can ask that object for its offset when a reference is needed, and if it isn't available yet, it gets added to a fixup list for forward refs, and then they get fixed up in a post-CU output phase. This is nice because I never have to worry about reference offsets as they "just work". I admit I am not as familiar with how the LLVM DWARFLinker does things.

Yes, that is the case - DIEs are emitted before the global abbreviations are known. This patch does similar fixup handling for references (the proper values are written later, when they are known). But that fixup works for fixed-size fields. For patching variable-size fields (like LEB128) it would be necessary to rewrite the already-generated DWARF (as we would need to shift data because of the changed field length).
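
A minimal sketch of that kind of fixed-size fixup (the names below are
hypothetical illustrations, not the classes used by this patch): a fixed-width
field such as a 4-byte DW_FORM_ref_addr is emitted as a zero placeholder, and
the final value is written over the same bytes later, so nothing is shifted.

#include "llvm/Support/Endian.h"
#include <cstdint>
#include <vector>

struct RefFixup {
  uint64_t PatchOffset;   // where the placeholder bytes live in the output
  const void *TargetDie;  // whatever identifies the referenced DIE
};

struct SectionBuffer {
  std::vector<uint8_t> Data;
  std::vector<RefFixup> Fixups;

  void emitPlaceholderRef(const void *TargetDie) {
    Fixups.push_back({Data.size(), TargetDie});
    Data.resize(Data.size() + 4); // four zero bytes, fixed size
  }

  // Called once the final offset of the referenced DIE is known.
  void applyFixup(const RefFixup &F, uint32_t FinalOffset) {
    llvm::support::endian::write32le(Data.data() + F.PatchOffset, FinalOffset);
  }
};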

The size of the abbreviation table for a clang binary with a 1.7 GB .debug_info is 12.5 KB for DWARFLinker and 7.2 MB for DWARFLinkerParallel, i.e. the new abbreviation table is approximately 0.5% of the overall .debug_info size. It looks relatively cheap. Still, any solution making .debug_abbrev shorter would certainly be good. We might experiment with fixed-length abbreviation numbers...

No real worry if the size isn't too big.

avl added a comment.EditedJun 21 2023, 7:18 AM

Another solution might be to reuse the abbreviation table from an already-generated CU for the next CU. At any given moment the current CU would own the abbreviation table, but in the end a single abbreviation table would be shared between several CUs. That way, several tables would still exist, but some of them would be shared. It would reduce the current size of .debug_abbrev.

I like this idea. Not needed for this patch, but sounds like a good idea.

Though there is some difficulty with this solution: the binary content would be non-deterministic, as it cannot be guaranteed which CU shares which abbreviation table.

Do we need the binary representation to be deterministic (byte-to-byte equal between runs)?

Perhaps we could use a special dump that would be deterministic, like the dumping from https://reviews.llvm.org/D124082? Even though the files themselves would not be byte-to-byte equal, the contents of the dump would be.

I don't have all of dsymutil paged in to do a really thorough/meaningful review of all the details. Even if I did I'm sure a bunch of stuff would slip through that would only be caught by real world qualification.

At a high level I think the approach makes sense. I've spent quite a bit of time thinking of alternatives and I can't think of anything more efficient given the constraints that we have (i.e. not being able to keep all the input DWARF concurrently in memory).

As for the implementation itself:

  • I like that you factored out things like the attribute cloning and I wonder if we could hoist this up and make it work with the non-parallel linker as well. I don't think we should go to extreme lengths to unify the two implementations, but even if we were to switch over to the new (parallel) implementation tomorrow, I expect the old one to be around for at least a few more years and I'd hate to have to maintain both.
  • I wonder if we could make the stages more explicit. If I'm reading the code right, the data (i.e. the DIE) and the logic (i.e. the live analysis) are shared in the same class and we have to maintain state. I would prefer a design where the two are decoupled and the data moves through the different stages. The way I'm imagining this is to have a class for every stage, possibly with its own shared context, and then have the DIEs move through them one after the other. It's fine for the DIE to know what stage we're in, but it would avoid things like init and reset iteration.

I left some inline comments here and there but I definitely need to do another pass.

llvm/lib/DWARFLinkerParallel/DIEAttributeCloner.h
48
68

Let's make these Doxygen style comments as well.

llvm/lib/DWARFLinkerParallel/DWARFLinkerCompileUnit.h
27

This should be singular: i.e. Stage.

97

How about clear or reset?

263

We need the reinterpret_cast because the OutDieOffsetArray stores uint64_ts instead of std::atomic<uint64_t>. Why can't we store the latter?

avl added a comment.EditedJun 22 2023, 7:17 AM

I don't have all of dsymutil paged in to do a really thorough/meaningful review of all the details. Even if I did I'm sure a bunch of stuff would slip through that would only be caught by real world qualification.

At a high level I think the approach makes sense. I've spent quite a bit of time thinking of alternatives and I can't think of anything more efficient given the constraints that we have (i.e. not being able to keep all the input DWARF concurrently in memory).

As for the implementation itself:

  • I like that you factored out things like the attribute cloning and I wonder if we could hoist this up and make it work with the non-parallel linker as well. I don't think we should go to extreme lengths to unify the two implementations, but even if we were to switch over to the new (parallel) implementation tomorrow, I expect the old one to be around for at least a few more years and I'd hate to have to maintain both.

Yes, it would be good to have a single implementation, but I do not see a simple way to do it.
Actually, there are other cases using similar code, e.g.:

llvm/unittests/DebugInfo/DWARF/DwarfGenerator.h
https://reviews.llvm.org/D130315 .

Thus, it would be useful to have a kind of DWARFLinkerBase library containing general code for cloning, creating, and emitting DIEs.
That library could be used by DWARFLinker, DWARFLinkerParallel, the DebugInfo unittests, and BOLT.
Though, I think there are a lot of details which would make implementing that library a difficult task.

Anyway, if we want to have a single implementation then the best way would probably be to think about creating a DWARFLinkerBase library.
That library should have base implementations for compile units and for cloning, creating, and emitting DIEs, and it should not depend on AsmPrinter.
What do you think?

  • I wonder if we could make the stages more explicit. If I'm reading the code right, the data (i.e. the DIE) and the logic (i.e. the live analysis) are shared in the same class and we have to maintain state. I would prefer a design where the two are decoupled and the data moves through the different stages. The way I'm imagining this is to have a class for every stage, possibly with its own shared context, and then have the DIEs move through them one after the other. It's fine for the DIE to know what stage we're in, but it would avoid things like init and reset iteration.

If I understood correctly, it looks like the current picture is quite close to that description:

The CompileUnit contains the data shared between stages, and compile units know the current stage.
There is a separate class doing the liveness analysis: DependencyTracker.
This class uses data kept by the CompileUnit (this data is the shared context).
The result of the liveness analysis is used by other stages, which is why the compile unit keeps the data.

We need "init" and "reset" functions as we need to erase data keeping by compile unit when we return to previous stages.
i.e. when we return to the previous stage we need to adapt shared context.
Probably instead of "init" and "reset" we need to name methods "sync shared context with the current stage" ?

llvm/lib/DWARFLinkerParallel/DWARFLinkerCompileUnit.h
263

std::atomic<> has neither a copy constructor nor a copy assignment operator. Because of this it cannot be put into a SmallVector.
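
A small sketch of the constraint (the element types here are only illustrative):

#include "llvm/ADT/SmallVector.h"
#include <atomic>
#include <cstdint>

void example() {
  llvm::SmallVector<uint64_t, 8> Plain;
  Plain.push_back(0); // fine: uint64_t is trivially copyable

  // llvm::SmallVector<std::atomic<uint64_t>, 8> Atomics;
  // Atomics.push_back(std::atomic<uint64_t>{0}); // would not compile:
  // std::atomic's copy constructor is deleted and no move constructor is
  // declared, so elements cannot be relocated when the vector grows.
}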

avl updated this revision to Diff 533936.Jun 23 2023, 5:54 AM

rebased. addressed comments.

avl updated this revision to Diff 536448.Jun 30 2023, 3:00 PM

rebased.

avl updated this revision to Diff 538391.Jul 8 2023, 2:51 PM

rebased.

avl added a comment.Jul 17 2023, 7:10 AM

friendly ping.

avl added a comment.Jul 25 2023, 6:26 AM

friendly ping.

avl updated this revision to Diff 546089.Aug 1 2023, 9:12 AM

rebased.

avl added a comment.Aug 1 2023, 9:15 AM

@JDevlieghere @aprantl

Does this patch require some changes?

Previous comment asks for refactoring attributes cloning. Should we create some DWARFLinkerBase library for this?

JDevlieghere accepted this revision.Aug 1 2023, 10:59 AM

@JDevlieghere @aprantl

Does this patch require some changes?

Previous comment asks for refactoring attributes cloning. Should we create some DWARFLinkerBase library for this?

No major concerns that block landing this. I still feel it would be great to unify stuff but we can do that incrementally after the patch has landed.

This revision is now accepted and ready to land.Aug 1 2023, 10:59 AM
avl added a comment.Aug 15 2023, 7:24 AM

Thank you for the review!

avl updated this revision to Diff 550326.Aug 15 2023, 7:27 AM

rebased.

avl updated this revision to Diff 550792.Aug 16 2023, 9:49 AM

rebased.

JDevlieghere accepted this revision.Aug 16 2023, 12:55 PM
nikic added a subscriber: nikic.Aug 21 2023, 1:40 AM

Reverted due to test failures on s390x, see e.g. https://lab.llvm.org/buildbot/#/builders/94/builds/16146.

llvm/unittests/DWARFLinkerParallel/StringPoolTest.cpp