This is an archive of the discontinued LLVM Phabricator instance.

Paths

Table of Contents

-
llvm/
-
include/llvm/MC/
-
llvm/
-
MC/
-
MCPseudoProbe.h
-
lib/MC/
-
MC/
1/5
MCPseudoProbe.cpp
-
tools/llvm-profgen/
-
llvm-profgen/
-
ProfiledBinary.h
-
ProfiledBinary.cpp

Differential D115950

[llvm-profgen] Use shared string table for function name to save memory usage
Accepted · Public

Authored by wlei on Dec 17 2021, 9:49 AM.

Download Raw Diff

Details

Reviewers

hoy
wenlei

Summary

Currently we have three maps that all store function names as std::string: a) FuncName in the pseudo probe section (GUID2FuncDescMap), b) FuncName in debug info (BinaryFunctions), and c) the symbolizer (NameStrings). We can optimize this by keeping one shared map that owns the strings and having the other two use StringRef, to save memory.

Diff Detail

Repository: rG LLVM Github Monorepo

Unit Tests: Failed

	Time	Test
	60 ms	x64 debian > LLVM.Bindings/Go::go.test

Event Timeline

wlei created this revision.Dec 17 2021, 9:49 AM

Herald added subscribers: hoy, wenlei, hiraditya. · View Herald TranscriptDec 17 2021, 9:49 AM

wlei requested review of this revision.Dec 17 2021, 9:49 AM

Herald added a project: Restricted Project. · View Herald TranscriptDec 17 2021, 9:49 AM

Herald added a subscriber: llvm-commits. · View Herald Transcript

wlei edited the summary of this revision. (Show Details)Dec 17 2021, 9:52 AM

wlei added reviewers: hoy, wenlei.

Harbormaster completed remote builds in B139866: Diff 395156.Dec 17 2021, 10:32 AM

wenlei added inline comments.Dec 17 2021, 11:10 AM

llvm/lib/MC/MCPseudoProbe.cpp
354	Just double checking, so the underlying data for probe section is freed after decoding? Where does that happen?

Thanks for the change. How much space do you see this helps save?

llvm/lib/MC/MCPseudoProbe.cpp
354	The real name is on the disk. When read, a temp object `ErrorOrName` is created which is then freed.

wenlei added inline comments.Dec 17 2021, 11:29 AM

llvm/lib/MC/MCPseudoProbe.cpp
354	ErrorOrName doesn't own the underlying data. I was asking about the underlying data. The data is MCPseudoProbeDecoder::Data. Is OwningBinary taking care of the freeing?

hoy added inline comments.Dec 17 2021, 11:35 AM

llvm/lib/MC/MCPseudoProbe.cpp
354	Yes, the binary object owns that underlying data buffer, i.e., the one pointed to by `const uint8_t *Start`.

In D115950#3200422, @hoy wrote:

Thanks for the change. How much space do you see this helps save?

I just tested it on our search infra; surprisingly, I didn't see any memory saved by this. I dug deeper and it showed that FuncNameStrings is not a big consumer: only ~1GB compared to the total consumption (200GB+), which is pretty small. Another guess is that the library has some optimization for allocating string memory, but I'm not very familiar with the underlying optimization of string allocation.

llvm/lib/MC/MCPseudoProbe.cpp
354	Yeah, the input binary info `OwningBinary<Binary> OBinary` is entirely freed after `load()` completes; otherwise we could have used StringRef directly before this change.

It's still good to have this optimization, thanks.

This revision is now accepted and ready to land.Dec 17 2021, 3:05 PM

lgtm, thanks.

Revision Contents

Path

Size

llvm/

include/

llvm/

MC/

MCPseudoProbe.h

6 lines

lib/

MC/

MCPseudoProbe.cpp

9 lines

tools/

llvm-profgen/

ProfiledBinary.h

12 lines

ProfiledBinary.cpp

12 lines

Diff 395156

llvm/include/llvm/MC/MCPseudoProbe.h

Show First 20 Lines • Show All 49 Lines • ▼ Show 20 Lines
#include "llvm/Support/ErrorOr.h"		#include "llvm/Support/ErrorOr.h"
#include <list>		#include <list>
#include <map>		#include <map>
#include <memory>		#include <memory>
#include <string>		#include <string>
#include <tuple>		#include <tuple>
#include <type_traits>		#include <type_traits>
#include <unordered_map>		#include <unordered_map>
		#include <unordered_set>
#include <vector>		#include <vector>

namespace llvm {		namespace llvm {

class MCSection;		class MCSection;
class MCStreamer;		class MCStreamer;
class MCSymbol;		class MCSymbol;
class MCObjectStreamer;		class MCObjectStreamer;
class raw_ostream;		class raw_ostream;

enum class MCPseudoProbeFlag {		enum class MCPseudoProbeFlag {
// If set, indicates that the probe is encoded as an address delta		// If set, indicates that the probe is encoded as an address delta
// instead of a real code address.		// instead of a real code address.
AddressDelta = 0x1,		AddressDelta = 0x1,
};		};

// Function descriptor decoded from .pseudo_probe_desc section		// Function descriptor decoded from .pseudo_probe_desc section
struct MCPseudoProbeFuncDesc {		struct MCPseudoProbeFuncDesc {
uint64_t FuncGUID = 0;		uint64_t FuncGUID = 0;
uint64_t FuncHash = 0;		uint64_t FuncHash = 0;
std::string FuncName;		StringRef FuncName;

MCPseudoProbeFuncDesc(uint64_t GUID, uint64_t Hash, StringRef Name)		MCPseudoProbeFuncDesc(uint64_t GUID, uint64_t Hash, StringRef Name)
: FuncGUID(GUID), FuncHash(Hash), FuncName(Name){};		: FuncGUID(GUID), FuncHash(Hash), FuncName(Name){};

void print(raw_ostream &OS);		void print(raw_ostream &OS);
};		};

class MCPseudoProbe;		class MCPseudoProbe;
▲ Show 20 Lines • Show All 259 Lines • ▼ Show 20 Lines	class MCPseudoProbeDecoder {
// Decoding helper function		// Decoding helper function
template <typename T> ErrorOr<T> readUnencodedNumber();		template <typename T> ErrorOr<T> readUnencodedNumber();
template <typename T> ErrorOr<T> readUnsignedNumber();		template <typename T> ErrorOr<T> readUnsignedNumber();
template <typename T> ErrorOr<T> readSignedNumber();		template <typename T> ErrorOr<T> readSignedNumber();
ErrorOr<StringRef> readString(uint32_t Size);		ErrorOr<StringRef> readString(uint32_t Size);

public:		public:
// Decode pseudo_probe_desc section to build GUID to PseudoProbeFuncDesc map.		// Decode pseudo_probe_desc section to build GUID to PseudoProbeFuncDesc map.
bool buildGUID2FuncDescMap(const uint8_t *Start, std::size_t Size);		bool buildGUID2FuncDescMap(const uint8_t *Start, std::size_t Size,
		std::unordered_set<std::string> &FuncNameStrings);

// Decode pseudo_probe section to build address to probes map.		// Decode pseudo_probe section to build address to probes map.
bool buildAddress2ProbeMap(const uint8_t *Start, std::size_t Size);		bool buildAddress2ProbeMap(const uint8_t *Start, std::size_t Size);

// Print pseudo_probe_desc section info		// Print pseudo_probe_desc section info
void printGUID2FuncDescMap(raw_ostream &OS);		void printGUID2FuncDescMap(raw_ostream &OS);

// Print pseudo_probe section info, used along with show-disassembly		// Print pseudo_probe section info, used along with show-disassembly
▲ Show 20 Lines • Show All 43 Lines • Show Last 20 Lines

llvm/lib/MC/MCPseudoProbe.cpp

Show First 20 Lines • Show All 306 Lines • ▼ Show 20 Lines	ErrorOr<StringRef> MCPseudoProbeDecoder::readString(uint32_t Size) {
StringRef Str(reinterpret_cast<const char *>(Data), Size);		StringRef Str(reinterpret_cast<const char *>(Data), Size);
if (Data + Size > End) {		if (Data + Size > End) {
return std::error_code();		return std::error_code();
}		}
Data += Size;		Data += Size;
return ErrorOr<StringRef>(Str);		return ErrorOr<StringRef>(Str);
}		}

bool MCPseudoProbeDecoder::buildGUID2FuncDescMap(const uint8_t *Start,		bool MCPseudoProbeDecoder::buildGUID2FuncDescMap(
std::size_t Size) {		const uint8_t *Start, std::size_t Size,
		std::unordered_set<std::string> &FuncNameStrings) {
// The pseudo_probe_desc section has a format like:		// The pseudo_probe_desc section has a format like:
// .section .pseudo_probe_desc,"",@progbits		// .section .pseudo_probe_desc,"",@progbits
// .quad -5182264717993193164 // GUID		// .quad -5182264717993193164 // GUID
// .quad 4294967295 // Hash		// .quad 4294967295 // Hash
// .uleb 3 // Name size		// .uleb 3 // Name size
// .ascii "foo" // Name		// .ascii "foo" // Name
// .quad -2624081020897602054		// .quad -2624081020897602054
// .quad 174696971957		// .quad 174696971957
Show All 20 Lines	while (Data < End) {
auto ErrorOrName = readString(NameSize);		auto ErrorOrName = readString(NameSize);
if (!ErrorOrName)		if (!ErrorOrName)
return false;		return false;

uint64_t GUID = std::move(*ErrorOrGUID);		uint64_t GUID = std::move(*ErrorOrGUID);
uint64_t Hash = std::move(*ErrorOrHash);		uint64_t Hash = std::move(*ErrorOrHash);
StringRef Name = std::move(*ErrorOrName);		StringRef Name = std::move(*ErrorOrName);

		auto It = FuncNameStrings.insert(Name.str());
		wenleiUnsubmitted Not Done Reply Inline Actions Just double checking, so the underlying data for probe section is freed after decoding? Where does that happen? wenlei: Just double checking, so the underlying data for probe section is freed after decoding? Where…
		hoyUnsubmitted Not Done Reply Inline Actions The real name is on the disk. When read, a temp object `ErrorOrName` is created which is then freed. hoy: The real name is on the disk. When read, a temp object `ErrorOrName` is created which is then…
		wenleiUnsubmitted Not Done Reply Inline Actions ErrorOrName doesn't own the underlying data. I was asking about the underlying data. The data is MCPseudoProbeDecoder::Data. Is OwningBinary taking care of the freeing? wenlei: ErrorOrName doesn't own the underlying data. I was asking about the underlying data. The data…
		hoyUnsubmitted Not Done Reply Inline Actions Yes, the binary object owns that underlying data buffer, i.e, pointed by `const uint8_t *Start`. hoy: Yes, the binary object owns that underlying data buffer, i.e, pointed by `const uint8_t *Start`.
		wleiAuthorUnsubmitted Done Reply Inline Actions Yeah, the input binary info `OwningBinary<Binary> OBinary` is all freed after `load()` completed, otherwise we can directly use StringRef before. wlei: Yeah, the input binary info `OwningBinary<Binary> OBinary` is all freed after `load()`…
// Initialize PseudoProbeFuncDesc and populate it into GUID2FuncDescMap		// Initialize PseudoProbeFuncDesc and populate it into GUID2FuncDescMap
GUID2FuncDescMap.emplace(GUID, MCPseudoProbeFuncDesc(GUID, Hash, Name));		GUID2FuncDescMap.emplace(GUID,
		MCPseudoProbeFuncDesc(GUID, Hash, *It.first));
}		}
assert(Data == End && "Have unprocessed data in pseudo_probe_desc section");		assert(Data == End && "Have unprocessed data in pseudo_probe_desc section");
return true;		return true;
}		}

bool MCPseudoProbeDecoder::buildAddress2ProbeMap(const uint8_t *Start,		bool MCPseudoProbeDecoder::buildAddress2ProbeMap(const uint8_t *Start,
std::size_t Size) {		std::size_t Size) {
// The pseudo_probe section encodes an inline forest and each tree has a		// The pseudo_probe section encodes an inline forest and each tree has a
▲ Show 20 Lines • Show All 205 Lines • Show Last 20 Lines

llvm/tools/llvm-profgen/ProfiledBinary.h

Show First 20 Lines • Show All 206 Lines • ▼ Show 20 Lines	class ProfiledBinary {
std::unique_ptr<const MCInstrInfo> MII;		std::unique_ptr<const MCInstrInfo> MII;
std::unique_ptr<MCDisassembler> DisAsm;		std::unique_ptr<MCDisassembler> DisAsm;
std::unique_ptr<const MCInstrAnalysis> MIA;		std::unique_ptr<const MCInstrAnalysis> MIA;
std::unique_ptr<MCInstPrinter> IPrinter;		std::unique_ptr<MCInstPrinter> IPrinter;
// A list of text sections sorted by start RVA and size. Used to check		// A list of text sections sorted by start RVA and size. Used to check
// if a given RVA is a valid code address.		// if a given RVA is a valid code address.
std::set<std::pair<uint64_t, uint64_t>> TextSections;		std::set<std::pair<uint64_t, uint64_t>> TextSections;

		// Shared string table owning function name strings, keep only one table to
		// save the memory.
		std::unordered_set<std::string> FuncNameStrings;

// A map of mapping function name to BinaryFunction info.		// A map of mapping function name to BinaryFunction info.
std::unordered_map<std::string, BinaryFunction> BinaryFunctions;		StringMap<BinaryFunction> BinaryFunctions;

// An ordered map of mapping function's start offset to function range		// An ordered map of mapping function's start offset to function range
// relevant info. Currently to determine if the offset of ELF is the start of		// relevant info. Currently to determine if the offset of ELF is the start of
// a real function, we leverage the function range info from DWARF.		// a real function, we leverage the function range info from DWARF.
std::map<uint64_t, FuncRange> StartOffset2FuncRangeMap;		std::map<uint64_t, FuncRange> StartOffset2FuncRangeMap;

// Offset to context location map. Used to expand the context.		// Offset to context location map. Used to expand the context.
std::unordered_map<uint64_t, SampleContextFrameVector> Offset2LocStackMap;		std::unordered_map<uint64_t, SampleContextFrameVector> Offset2LocStackMap;
Show All 15 Lines	class ProfiledBinary {
PrologEpilogTracker ProEpilogTracker;		PrologEpilogTracker ProEpilogTracker;

// Track function sizes under different context		// Track function sizes under different context
BinarySizeContextTracker FuncSizeTracker;		BinarySizeContextTracker FuncSizeTracker;

// The symbolizer used to get inline context for an instruction.		// The symbolizer used to get inline context for an instruction.
std::unique_ptr<symbolize::LLVMSymbolizer> Symbolizer;		std::unique_ptr<symbolize::LLVMSymbolizer> Symbolizer;

// String table owning function name strings created from the symbolizer.
std::unordered_set<std::string> NameStrings;

// A collection of functions to print disassembly for.		// A collection of functions to print disassembly for.
StringSet<> DisassembleFunctionSet;		StringSet<> DisassembleFunctionSet;

// Pseudo probe decoder		// Pseudo probe decoder
MCPseudoProbeDecoder ProbeDecoder;		MCPseudoProbeDecoder ProbeDecoder;

bool UsePseudoProbes = false;		bool UsePseudoProbes = false;

▲ Show 20 Lines • Show All 173 Lines • ▼ Show 20 Lines	RangesTy getRangesForOffset(uint64_t Offset) {
auto *FRange = findFuncRangeForOffset(Offset);		auto *FRange = findFuncRangeForOffset(Offset);
// Ignore the range which falls into plt section or system lib.		// Ignore the range which falls into plt section or system lib.
if (!FRange)		if (!FRange)
return RangesTy();		return RangesTy();

return FRange->Func->Ranges;		return FRange->Func->Ranges;
}		}

const std::unordered_map<std::string, BinaryFunction> &		const StringMap<BinaryFunction> &getAllBinaryFunctions() {
getAllBinaryFunctions() {
return BinaryFunctions;		return BinaryFunctions;
}		}

BinaryFunction *getBinaryFunction(StringRef FName) {		BinaryFunction *getBinaryFunction(StringRef FName) {
auto I = BinaryFunctions.find(FName.str());		auto I = BinaryFunctions.find(FName.str());
if (I == BinaryFunctions.end())		if (I == BinaryFunctions.end())
return nullptr;		return nullptr;
return &I->second;		return &I->second;
▲ Show 20 Lines • Show All 88 Lines • Show Last 20 Lines

llvm/tools/llvm-profgen/ProfiledBinary.cpp

Show First 20 Lines • Show All 169 Lines • ▼ Show 20 Lines	for (auto &R : F.second.Ranges) {
}		}
}		}
}		}

if (!hasFuncEntry) {		if (!hasFuncEntry) {
NoFuncEntryNum++;		NoFuncEntryNum++;
if (ShowDetailedWarning)		if (ShowDetailedWarning)
WithColor::warning()		WithColor::warning()
<< "Failed to determine function entry for " << F.first		<< "Failed to determine function entry for " << F.first()
<< " due to inconsistent name from symbol table and dwarf info.\n";		<< " due to inconsistent name from symbol table and dwarf info.\n";
}		}
}		}
emitWarningSummary(NoFuncEntryNum, BinaryFunctions.size(),		emitWarningSummary(NoFuncEntryNum, BinaryFunctions.size(),
"of functions failed to determine function entry due to "		"of functions failed to determine function entry due to "
"inconsistent name from symbol table and dwarf info.");		"inconsistent name from symbol table and dwarf info.");
}		}

▲ Show 20 Lines • Show All 144 Lines • ▼ Show 20 Lines	for (section_iterator SI = Obj->section_begin(), SE = Obj->section_end();
SI != SE; ++SI) {		SI != SE; ++SI) {
const SectionRef &Section = *SI;		const SectionRef &Section = *SI;
StringRef SectionName = unwrapOrError(Section.getName(), FileName);		StringRef SectionName = unwrapOrError(Section.getName(), FileName);

if (SectionName == ".pseudo_probe_desc") {		if (SectionName == ".pseudo_probe_desc") {
StringRef Contents = unwrapOrError(Section.getContents(), FileName);		StringRef Contents = unwrapOrError(Section.getContents(), FileName);
if (!ProbeDecoder.buildGUID2FuncDescMap(		if (!ProbeDecoder.buildGUID2FuncDescMap(
reinterpret_cast<const uint8_t *>(Contents.data()),		reinterpret_cast<const uint8_t *>(Contents.data()),
Contents.size()))		Contents.size(), FuncNameStrings))
exitWithError("Pseudo Probe decoder fail in .pseudo_probe_desc section");		exitWithError("Pseudo Probe decoder fail in .pseudo_probe_desc section");
} else if (SectionName == ".pseudo_probe") {		} else if (SectionName == ".pseudo_probe") {
StringRef Contents = unwrapOrError(Section.getContents(), FileName);		StringRef Contents = unwrapOrError(Section.getContents(), FileName);
if (!ProbeDecoder.buildAddress2ProbeMap(		if (!ProbeDecoder.buildAddress2ProbeMap(
reinterpret_cast<const uint8_t *>(Contents.data()),		reinterpret_cast<const uint8_t *>(Contents.data()),
Contents.size()))		Contents.size()))
exitWithError("Pseudo Probe decoder fail in .pseudo_probe section");		exitWithError("Pseudo Probe decoder fail in .pseudo_probe section");
// set UsePseudoProbes flag, used for PerfReader		// set UsePseudoProbes flag, used for PerfReader
▲ Show 20 Lines • Show All 277 Lines • ▼ Show 20 Lines	for (const auto &DieInfo : CompilationUnit->dies()) {
continue;		continue;
const DWARFAddressRangesVector &Ranges = RangesOrError.get();		const DWARFAddressRangesVector &Ranges = RangesOrError.get();

if (Ranges.empty())		if (Ranges.empty())
continue;		continue;

// Different DWARF symbols can have same function name, search or create		// Different DWARF symbols can have same function name, search or create
// BinaryFunction indexed by the name.		// BinaryFunction indexed by the name.
auto Ret = BinaryFunctions.emplace(Name, BinaryFunction());		// Stablize in a shared function name string table.
		auto It = FuncNameStrings.insert(Name);
		auto Ret = BinaryFunctions.try_emplace(*It.first, BinaryFunction());
auto &Func = Ret.first->second;		auto &Func = Ret.first->second;
if (Ret.second)		if (Ret.second)
Func.FuncName = Ret.first->first;		Func.FuncName = Ret.first->first();

for (const auto &Range : Ranges) {		for (const auto &Range : Ranges) {
uint64_t FuncStart = Range.LowPC;		uint64_t FuncStart = Range.LowPC;
uint64_t FuncSize = Range.HighPC - FuncStart;		uint64_t FuncSize = Range.HighPC - FuncStart;

if (FuncSize == 0 \|\| FuncStart < getPreferredBaseAddress())		if (FuncSize == 0 \|\| FuncStart < getPreferredBaseAddress())
continue;		continue;

▲ Show 20 Lines • Show All 64 Lines • ▼ Show 20 Lines	for (int32_t I = InlineStack.getNumberOfFrames() - 1; I >= 0; I--) {
uint32_t LineOffset = (CallerFrame.Line - CallerFrame.StartLine) & 0xffff;		uint32_t LineOffset = (CallerFrame.Line - CallerFrame.StartLine) & 0xffff;
if (UseProbeDiscriminator) {		if (UseProbeDiscriminator) {
LineOffset =		LineOffset =
PseudoProbeDwarfDiscriminator::extractProbeIndex(Discriminator);		PseudoProbeDwarfDiscriminator::extractProbeIndex(Discriminator);
Discriminator = 0;		Discriminator = 0;
}		}

LineLocation Line(LineOffset, Discriminator);		LineLocation Line(LineOffset, Discriminator);
auto It = NameStrings.insert(FunctionName.str());		auto It = FuncNameStrings.insert(FunctionName.str());
CallStack.emplace_back(*It.first, Line);		CallStack.emplace_back(*It.first, Line);
}		}

return CallStack;		return CallStack;
}		}

void ProfiledBinary::computeInlinedContextSizeForRange(uint64_t StartOffset,		void ProfiledBinary::computeInlinedContextSizeForRange(uint64_t StartOffset,
uint64_t EndOffset) {		uint64_t EndOffset) {
▲ Show 20 Lines • Show All 64 Lines • Show Last 20 Lines