Diff 373134

lld/MachO/ICF.cpp

Show First 20 Lines • Show All 170 Lines • ▼ Show 20 Lines	if (ra.referent.is<Symbol *>()) {
const auto sb = rb.referent.get<InputSection >();		const auto sb = rb.referent.get<InputSection >();
isecA = dyn_cast<ConcatInputSection>(sa);		isecA = dyn_cast<ConcatInputSection>(sa);
if (!isecA)		if (!isecA)
return true;		return true;
isecB = cast<ConcatInputSection>(sb);		isecB = cast<ConcatInputSection>(sb);
}		}
return isecA->icfEqClass[icfPass % 2] == isecB->icfEqClass[icfPass % 2];		return isecA->icfEqClass[icfPass % 2] == isecB->icfEqClass[icfPass % 2];
};		};
return std::equal(ia->relocs.begin(), ia->relocs.end(), ib->relocs.begin(),		if (!std::equal(ia->relocs.begin(), ia->relocs.end(), ib->relocs.begin(), f))
f);		return false;

		// If there are symbols with associated unwind info, check that the unwind
		// info matches. For simplicity, we only handle the case where there are only
		// symbols at offset zero within the section (which is typically the case with
		// .subsections_via_symbols.)
		auto hasCU = [](Defined *d) { return d->compactUnwind; };
		auto itA = std::find_if(ia->symbols.begin(), ia->symbols.end(), hasCU);
		auto itB = std::find_if(ib->symbols.begin(), ib->symbols.end(), hasCU);
		if (itA == ia->symbols.end())
		return itB == ib->symbols.end();
		if (itB == ib->symbols.end())
		return false;
		const Defined da = itA;
		const Defined db = itB;
		if (da->compactUnwind->icfEqClass[icfPass % 2] !=
		db->compactUnwind->icfEqClass[icfPass % 2] \|\|
		da->value != 0 \|\| db->value != 0)
		return false;
		auto isZero = [](Defined *d) { return d->value == 0; };
		return std::find_if_not(std::next(itA), ia->symbols.end(), isZero) ==
		ia->symbols.end() &&
		std::find_if_not(std::next(itB), ib->symbols.end(), isZero) ==
		ib->symbols.end();
}		}

// Find the first InputSection after BEGIN whose equivalence class differs		// Find the first InputSection after BEGIN whose equivalence class differs
size_t ICF::findBoundary(size_t begin, size_t end) {		size_t ICF::findBoundary(size_t begin, size_t end) {
uint64_t beginHash = icfInputs[begin]->icfEqClass[icfPass % 2];		uint64_t beginHash = icfInputs[begin]->icfEqClass[icfPass % 2];
for (size_t i = begin + 1; i < end; ++i)		for (size_t i = begin + 1; i < end; ++i)
if (beginHash != icfInputs[i]->icfEqClass[icfPass % 2])		if (beginHash != icfInputs[i]->icfEqClass[icfPass % 2])
return i;		return i;
▲ Show 20 Lines • Show All 140 Lines • ▼ Show 20 Lines	void macho::foldIdenticalSections() {
// ICF::segregate()		// ICF::segregate()
std::vector<ConcatInputSection *> hashable;		std::vector<ConcatInputSection *> hashable;
uint64_t icfUniqueID = inputSections.size();		uint64_t icfUniqueID = inputSections.size();
for (ConcatInputSection *isec : inputSections) {		for (ConcatInputSection *isec : inputSections) {
// FIXME: consider non-code __text sections as hashable?		// FIXME: consider non-code __text sections as hashable?
bool isHashable = (isCodeSection(isec) \|\| isCfStringSection(isec)) &&		bool isHashable = (isCodeSection(isec) \|\| isCfStringSection(isec)) &&
!isec->shouldOmitFromOutput() &&		!isec->shouldOmitFromOutput() &&
isec->isHashableForICF();		isec->isHashableForICF();
// ICF can't fold functions with unwind info		if (isHashable) {
if (isHashable)
for (Defined *d : isec->symbols)
if (d->compactUnwind) {
isHashable = false;
break;
}

if (isHashable)
hashable.push_back(isec);		hashable.push_back(isec);
else		for (Defined *d : isec->symbols)
		if (d->compactUnwind)
		hashable.push_back(d->compactUnwind);
		} else {
isec->icfEqClass[0] = ++icfUniqueID;		isec->icfEqClass[0] = ++icfUniqueID;
}		}
		}
parallelForEach(hashable,		parallelForEach(hashable,
[](ConcatInputSection *isec) { isec->hashForICF(); });		[](ConcatInputSection *isec) { isec->hashForICF(); });
// Now that every input section is either hashed or marked as unique, run the		// Now that every input section is either hashed or marked as unique, run the
// segregation algorithm to detect foldable subsections.		// segregation algorithm to detect foldable subsections.
ICF(hashable).run();		ICF(hashable).run();
}		}

lld/MachO/InputFiles.cpp

Show First 20 Lines • Show All 886 Lines • ▼ Show 20 Lines	for (SubsectionMap &map : subsections) {
cuSubsecMap = &map;		cuSubsecMap = &map;
break;		break;
}		}
if (!cuSubsecMap)		if (!cuSubsecMap)
return;		return;

for (SubsectionEntry &entry : *cuSubsecMap) {		for (SubsectionEntry &entry : *cuSubsecMap) {
ConcatInputSection *isec = cast<ConcatInputSection>(entry.isec);		ConcatInputSection *isec = cast<ConcatInputSection>(entry.isec);
		// Hack!! Since each CUE contains a different function address, if ICF
		// operated naively and compared the entire contents of each CUE, entries
		// with identical unwind info but belonging to different functions would
		// never be considered equivalent. To work around this problem, we slice
		// away the function address here. (Note that we do not adjust the offsets
		// of the corresponding relocations.) We rely on `relocateCompactUnwind()`
		// to correctly handle these truncated input sections.
		isec->data = isec->data.slice(target->wordSize);

ConcatInputSection *referentIsec;		ConcatInputSection *referentIsec;
for (const Reloc &r : isec->relocs) {		for (auto it = isec->relocs.begin(); it != isec->relocs.end();) {
if (r.offset != 0)		Reloc &r = *it;
		// We only wish to handle the relocation for CUE::functionAddress.
		if (r.offset != 0) {
		++it;
continue;		continue;
		}
uint64_t add = r.addend;		uint64_t add = r.addend;
if (auto sym = cast_or_null<Defined>(r.referent.dyn_cast<Symbol >())) {		if (auto sym = cast_or_null<Defined>(r.referent.dyn_cast<Symbol >())) {
add += sym->value;		add += sym->value;
referentIsec = cast<ConcatInputSection>(sym->isec);		referentIsec = cast<ConcatInputSection>(sym->isec);
} else {		} else {
referentIsec =		referentIsec =
cast<ConcatInputSection>(r.referent.dyn_cast<InputSection *>());		cast<ConcatInputSection>(r.referent.dyn_cast<InputSection *>());
}		}
		if (referentIsec->getSegName() != segment_names::text)
		error("compact unwind references address in " + toString(referentIsec) +
		" which is not in segment __TEXT");
// The functionAddress relocations are typically section relocations.		// The functionAddress relocations are typically section relocations.
// However, unwind info operates on a per-symbol basis, so we search for		// However, unwind info operates on a per-symbol basis, so we search for
// the function symbol here.		// the function symbol here.
auto it = llvm::lower_bound(		auto symIt = llvm::lower_bound(
referentIsec->symbols, add,		referentIsec->symbols, add,
[](Defined *d, uint64_t add) { return d->value < add; });		[](Defined *d, uint64_t add) { return d->value < add; });
// The relocation should point at the exact address of a symbol (with no		// The relocation should point at the exact address of a symbol (with no
// addend).		// addend).
if (it == referentIsec->symbols.end() \|\| (*it)->value != add) {		if (symIt == referentIsec->symbols.end() \|\| (*symIt)->value != add) {
assert(referentIsec->wasCoalesced);		assert(referentIsec->wasCoalesced);
		++it;
continue;		continue;
}		}
(*it)->compactUnwind = isec;		(*symIt)->compactUnwind = isec;
		// Since we've sliced away the functionAddress, we should remove the
		// corresponding relocation too. Given that clang emits relocations in
		// reverse order of address, this relocation should be at the end of the
		// vector for most of our input object files, so this is typically an O(1)
		// operation.
		it = isec->relocs.erase(it);
}		}
}		}
}		}

// The path can point to either a dylib or a .tbd file.		// The path can point to either a dylib or a .tbd file.
static DylibFile loadDylib(StringRef path, DylibFile umbrella) {		static DylibFile loadDylib(StringRef path, DylibFile umbrella) {
Optional<MemoryBufferRef> mbref = readFile(path);		Optional<MemoryBufferRef> mbref = readFile(path);
if (!mbref) {		if (!mbref) {
▲ Show 20 Lines • Show All 512 Lines • Show Last 20 Lines

lld/MachO/UnwindInfoSection.cpp

Show First 20 Lines • Show All 268 Lines • ▼ Show 20 Lines	uint8_t buf = reinterpret_cast<uint8_t >(cuVector.data()) +
i * sizeof(CompactUnwindEntry<Ptr>);		i * sizeof(CompactUnwindEntry<Ptr>);
const Defined *d = symbolsVec[i].second;		const Defined *d = symbolsVec[i].second;
// Write the functionAddress.		// Write the functionAddress.
writeAddress(buf, d->getVA(), sizeof(Ptr) == 8 ? 3 : 2);		writeAddress(buf, d->getVA(), sizeof(Ptr) == 8 ? 3 : 2);
if (!d->compactUnwind)		if (!d->compactUnwind)
return;		return;

// Write the rest of the CUE.		// Write the rest of the CUE.
memcpy(buf, d->compactUnwind->data.data(), d->compactUnwind->data.size());		memcpy(buf + sizeof(Ptr), d->compactUnwind->data.data(),
		d->compactUnwind->data.size());
for (const Reloc &r : d->compactUnwind->relocs) {		for (const Reloc &r : d->compactUnwind->relocs) {
uint64_t referentVA = 0;		uint64_t referentVA = 0;
if (auto referentSym = r.referent.dyn_cast<Symbol >()) {		if (auto referentSym = r.referent.dyn_cast<Symbol >()) {
if (!isa<Undefined>(referentSym)) {		if (!isa<Undefined>(referentSym)) {
if (auto *defined = dyn_cast<Defined>(referentSym))		if (auto *defined = dyn_cast<Defined>(referentSym))
checkTextSegment(defined->isec);		checkTextSegment(defined->isec);
// At this point in the link, we may not yet know the final address of		// At this point in the link, we may not yet know the final address of
// the GOT, so we just encode the index. We make it a 1-based index so		// the GOT, so we just encode the index. We make it a 1-based index so
▲ Show 20 Lines • Show All 331 Lines • Show Last 20 Lines

lld/test/MachO/icf.s

Show All 26 Lines
# CHECK: [[#%x,WITH_ALT_ENTRY:]] l F __TEXT,__text _no_alt_entry		# CHECK: [[#%x,WITH_ALT_ENTRY:]] l F __TEXT,__text _no_alt_entry
# CHECK: [[#%x,DEFINED_REF_WITH_ADDEND_2:]] l F __TEXT,__text _defined_ref_with_addend_1		# CHECK: [[#%x,DEFINED_REF_WITH_ADDEND_2:]] l F __TEXT,__text _defined_ref_with_addend_1
# CHECK: [[#%x,DEFINED_REF_WITH_ADDEND_2:]] l F __TEXT,__text _defined_ref_with_addend_2		# CHECK: [[#%x,DEFINED_REF_WITH_ADDEND_2:]] l F __TEXT,__text _defined_ref_with_addend_2
# CHECK: [[#%x,RECURSIVE:]] l F __TEXT,__text _recursive		# CHECK: [[#%x,RECURSIVE:]] l F __TEXT,__text _recursive
# CHECK: [[#%x,CALL_RECURSIVE_2:]] l F __TEXT,__text _call_recursive_1		# CHECK: [[#%x,CALL_RECURSIVE_2:]] l F __TEXT,__text _call_recursive_1
# CHECK: [[#%x,CALL_RECURSIVE_2:]] l F __TEXT,__text _call_recursive_2		# CHECK: [[#%x,CALL_RECURSIVE_2:]] l F __TEXT,__text _call_recursive_2
# CHECK: [[#%x,CHECK_LENGTH_1:]] l F __TEXT,__text _check_length_1		# CHECK: [[#%x,CHECK_LENGTH_1:]] l F __TEXT,__text _check_length_1
# CHECK: [[#%x,CHECK_LENGTH_2:]] l F __TEXT,__text _check_length_2		# CHECK: [[#%x,CHECK_LENGTH_2:]] l F __TEXT,__text _check_length_2
# CHECK: [[#%x,HAS_UNWIND_1:]] l F __TEXT,__text _has_unwind_1		# CHECK: [[#%x,HAS_UNWIND_2:]] l F __TEXT,__text _has_unwind_1
# CHECK: [[#%x,HAS_UNWIND_2:]] l F __TEXT,__text _has_unwind_2		# CHECK: [[#%x,HAS_UNWIND_2:]] l F __TEXT,__text _has_unwind_2
		# CHECK: [[#%x,HAS_UNWIND_3:]] l F __TEXT,__text _has_unwind_3
# CHECK: [[#%x,MUTALLY_RECURSIVE_2:]] l F __TEXT,__text _mutually_recursive_1		# CHECK: [[#%x,MUTALLY_RECURSIVE_2:]] l F __TEXT,__text _mutually_recursive_1
# CHECK: [[#%x,MUTALLY_RECURSIVE_2:]] l F __TEXT,__text _mutually_recursive_2		# CHECK: [[#%x,MUTALLY_RECURSIVE_2:]] l F __TEXT,__text _mutually_recursive_2
# CHECK: [[#%x,INIT_2:]] l F __TEXT,__text _init_1		# CHECK: [[#%x,INIT_2:]] l F __TEXT,__text _init_1
# CHECK: [[#%x,INIT_2:]] l F __TEXT,__text _init_2		# CHECK: [[#%x,INIT_2:]] l F __TEXT,__text _init_2
# CHECK: [[#%x,INIT_3:]] l O __TEXT,__foo _init_3		# CHECK: [[#%x,INIT_3:]] l O __TEXT,__foo _init_3
### FIXME: Mutually-recursive functions with identical bodies (see below)		### FIXME: Mutually-recursive functions with identical bodies (see below)
# COM: [[#%x,ASYMMETRIC_RECURSIVE_2:]] l F __TEXT,__text _asymmetric_recursive_1		# COM: [[#%x,ASYMMETRIC_RECURSIVE_2:]] l F __TEXT,__text _asymmetric_recursive_1
# COM: [[#%x,ASYMMETRIC_RECURSIVE_2]] l F __TEXT,__text _asymmetric_recursive_2		# COM: [[#%x,ASYMMETRIC_RECURSIVE_2]] l F __TEXT,__text _asymmetric_recursive_2
Show All 14 Lines
# CHECK: callq 0x[[#%x,WITH_ALT_ENTRY:]] <_with_alt_entry>		# CHECK: callq 0x[[#%x,WITH_ALT_ENTRY:]] <_with_alt_entry>
# CHECK: callq 0x[[#%x,DEFINED_REF_WITH_ADDEND_2:]] <_defined_ref_with_addend_2>		# CHECK: callq 0x[[#%x,DEFINED_REF_WITH_ADDEND_2:]] <_defined_ref_with_addend_2>
# CHECK: callq 0x[[#%x,DEFINED_REF_WITH_ADDEND_2:]] <_defined_ref_with_addend_2>		# CHECK: callq 0x[[#%x,DEFINED_REF_WITH_ADDEND_2:]] <_defined_ref_with_addend_2>
# CHECK: callq 0x[[#%x,RECURSIVE:]] <_recursive>		# CHECK: callq 0x[[#%x,RECURSIVE:]] <_recursive>
# CHECK: callq 0x[[#%x,CALL_RECURSIVE_2:]] <_call_recursive_2>		# CHECK: callq 0x[[#%x,CALL_RECURSIVE_2:]] <_call_recursive_2>
# CHECK: callq 0x[[#%x,CALL_RECURSIVE_2:]] <_call_recursive_2>		# CHECK: callq 0x[[#%x,CALL_RECURSIVE_2:]] <_call_recursive_2>
# CHECK: callq 0x[[#%x,CHECK_LENGTH_1:]] <_check_length_1>		# CHECK: callq 0x[[#%x,CHECK_LENGTH_1:]] <_check_length_1>
# CHECK: callq 0x[[#%x,CHECK_LENGTH_2:]] <_check_length_2>		# CHECK: callq 0x[[#%x,CHECK_LENGTH_2:]] <_check_length_2>
# CHECK: callq 0x[[#%x,HAS_UNWIND_1:]] <_has_unwind_1>
# CHECK: callq 0x[[#%x,HAS_UNWIND_2:]] <_has_unwind_2>		# CHECK: callq 0x[[#%x,HAS_UNWIND_2:]] <_has_unwind_2>
		# CHECK: callq 0x[[#%x,HAS_UNWIND_2:]] <_has_unwind_2>
		# CHECK: callq 0x[[#%x,HAS_UNWIND_3:]] <_has_unwind_3>
# CHECK: callq 0x[[#%x,MUTALLY_RECURSIVE_2:]] <_mutually_recursive_2>		# CHECK: callq 0x[[#%x,MUTALLY_RECURSIVE_2:]] <_mutually_recursive_2>
# CHECK: callq 0x[[#%x,MUTALLY_RECURSIVE_2:]] <_mutually_recursive_2>		# CHECK: callq 0x[[#%x,MUTALLY_RECURSIVE_2:]] <_mutually_recursive_2>
## FIXME: Mutually-recursive functions with identical bodies (see below)		## FIXME: Mutually-recursive functions with identical bodies (see below)
# COM: callq 0x[[#%x,ASYMMETRIC_RECURSIVE_2]] <_asymmetric_recursive_2>		# COM: callq 0x[[#%x,ASYMMETRIC_RECURSIVE_2]] <_asymmetric_recursive_2>
# COM: callq 0x[[#%x,ASYMMETRIC_RECURSIVE_2]] <_asymmetric_recursive_2>		# COM: callq 0x[[#%x,ASYMMETRIC_RECURSIVE_2]] <_asymmetric_recursive_2>
# CHECK: callq 0x[[#%x,INIT_2:]] <_init_2>		# CHECK: callq 0x[[#%x,INIT_2:]] <_init_2>
# CHECK: callq 0x[[#%x,INIT_2:]] <_init_2>		# CHECK: callq 0x[[#%x,INIT_2:]] <_init_2>
# CHECK: callq 0x[[#%x,INIT_3:]] <_init_3>		# CHECK: callq 0x[[#%x,INIT_3:]] <_init_3>
▲ Show 20 Lines • Show All 88 Lines • ▼ Show 20 Lines

_check_length_2:		_check_length_2:
movq $97, %rax		movq $97, %rax
.space 1		.space 1

_my_personality:		_my_personality:
mov $1345, %rax		mov $1345, %rax

## No fold: functions have unwind info.		## Functions with identical unwind info should be folded.
## FIXME: Fold functions with identical unwind info.
_has_unwind_1:		_has_unwind_1:
.cfi_startproc		.cfi_startproc
.cfi_personality 155, _my_personality		.cfi_personality 155, _my_personality
.cfi_def_cfa_offset 16		.cfi_def_cfa_offset 16
ret		ret
.cfi_endproc		.cfi_endproc

_has_unwind_2:		_has_unwind_2:
.cfi_startproc		.cfi_startproc
.cfi_personality 155, _my_personality		.cfi_personality 155, _my_personality
.cfi_def_cfa_offset 16		.cfi_def_cfa_offset 16
ret		ret
.cfi_endproc		.cfi_endproc

		## This function has different unwind info from the preceding two, and therefore
		## should not be folded.
		_has_unwind_3:
		.cfi_startproc
		.cfi_personality 155, _my_personality
		.cfi_def_cfa_offset 8
		ret
		.cfi_endproc

## Fold: Mutually-recursive functions with symmetric bodies		## Fold: Mutually-recursive functions with symmetric bodies
_mutually_recursive_1:		_mutually_recursive_1:
callq _mutually_recursive_1 # call myself		callq _mutually_recursive_1 # call myself
callq _mutually_recursive_2 # call my twin		callq _mutually_recursive_2 # call my twin

_mutually_recursive_2:		_mutually_recursive_2:
callq _mutually_recursive_2 # call myself		callq _mutually_recursive_2 # call myself
callq _mutually_recursive_1 # call my twin		callq _mutually_recursive_1 # call my twin
▲ Show 20 Lines • Show All 51 Lines • ▼ Show 20 Lines	_main:
callq _defined_ref_with_addend_2		callq _defined_ref_with_addend_2
callq _recursive		callq _recursive
callq _call_recursive_1		callq _call_recursive_1
callq _call_recursive_2		callq _call_recursive_2
callq _check_length_1		callq _check_length_1
callq _check_length_2		callq _check_length_2
callq _has_unwind_1		callq _has_unwind_1
callq _has_unwind_2		callq _has_unwind_2
		callq _has_unwind_3
callq _mutually_recursive_1		callq _mutually_recursive_1
callq _mutually_recursive_2		callq _mutually_recursive_2
callq _asymmetric_recursive_1		callq _asymmetric_recursive_1
callq _asymmetric_recursive_2		callq _asymmetric_recursive_2
callq _init_1		callq _init_1
callq _init_2		callq _init_2
callq _init_3		callq _init_3

lld/test/MachO/invalid/compact-unwind-bad-reloc.s

	# REQUIRES: x86			# REQUIRES: x86
	# RUN: llvm-mc -filetype=obj -triple=x86_64-apple-darwin19.0.0 %s -o %t.o			# RUN: rm -rf %t; split-file %s %t
	# RUN: not %lld -pie -lSystem -lc++ %t.o -o %t 2>&1 \| FileCheck %s -DFILE=%t.o			# RUN: llvm-mc -filetype=obj -triple=x86_64-apple-darwin19.0.0 %t/bad-function.s -o %t/bad-function.o
				# RUN: llvm-mc -filetype=obj -triple=x86_64-apple-darwin19.0.0 %t/bad-personality.s -o %t/bad-personality.o
				# RUN: not %lld -pie -lSystem -lc++ %t/bad-function.o -o %t 2>&1 \| FileCheck %s -DFILE=%t/bad-function.o
				# RUN: not %lld -pie -lSystem -lc++ %t/bad-personality.o -o %t 2>&1 \| FileCheck %s -DFILE=%t/bad-personality.o
	# CHECK: error: compact unwind references address in [[FILE]]:(__data) which is not in segment __TEXT			# CHECK: error: compact unwind references address in [[FILE]]:(__data) which is not in segment __TEXT

	.globl _main, _not_a_function			#--- bad-function.s
	.text
	_main:
	retq

	.data			.data
	_not_a_function:			_not_a_function:
	.cfi_startproc			.cfi_startproc
	.cfi_personality 155, ___gxx_personality_v0			.cfi_personality 155, ___gxx_personality_v0
	.cfi_def_cfa_offset 16			.cfi_def_cfa_offset 16
	retq			retq
	.cfi_endproc			.cfi_endproc

				#--- bad-personality.s
				.globl _main, _not_a_function
				.text
				_main:
				.cfi_startproc
				.cfi_personality 155, _my_personality
				.cfi_def_cfa_offset 16
				retq
				.cfi_endproc

				.data
				.globl _my_personality
				_my_personality:

This is an archive of the discontinued LLVM Phabricator instance.

[lld-macho] Teach ICF to dedup functions with identical unwind info
Closed · Public

Details

Diff Detail

Event Timeline

Revision Contents

Diff 373134

lld/MachO/ICF.cpp

lld/MachO/InputFiles.cpp

lld/MachO/UnwindInfoSection.cpp

lld/test/MachO/icf.s

lld/test/MachO/invalid/compact-unwind-bad-reloc.s

This is an archive of the discontinued LLVM Phabricator instance.

[lld-macho] Teach ICF to dedup functions with identical unwind info (Closed · Public)

Details

Diff Detail

Event Timeline

Revision Contents

Diff 373134

lld/MachO/ICF.cpp

lld/MachO/InputFiles.cpp

lld/MachO/UnwindInfoSection.cpp

lld/test/MachO/icf.s

lld/test/MachO/invalid/compact-unwind-bad-reloc.s

[lld-macho] Teach ICF to dedup functions with identical unwind info
Closed · Public