diff --git a/llvm/tools/llvm-profgen/PerfReader.h b/llvm/tools/llvm-profgen/PerfReader.h --- a/llvm/tools/llvm-profgen/PerfReader.h +++ b/llvm/tools/llvm-profgen/PerfReader.h @@ -541,11 +541,14 @@ std::unordered_map; // Load binaries and read perf trace to parse the events and samples -class PerfReader { - +class PerfReaderBase { public: - PerfReader(cl::list &BinaryFilenames, - cl::list &PerfTraceFilenames); + PerfReaderBase(cl::list &BinaryFilenames); + virtual ~PerfReaderBase() = default; + static std::unique_ptr + create(cl::list &BinaryFilenames, + cl::list &PerfTraceFilenames); + static void loadBinaries(cl::list &BinaryFilenames); // A LBR sample is like: // 0x5c6313f/0x5c63170/P/-/-/0 0x5c630e7/0x5c63130/P/-/-/0 ... @@ -614,10 +617,12 @@ return BinarySampleCounters; } -private: +protected: /// Validate the command line input - void validateCommandLine(cl::list &BinaryFilenames, - cl::list &PerfTraceFilenames); + static void validateCommandLine(cl::list &BinaryFilenames, + cl::list &PerfTraceFilenames); + static PerfScriptType + extractPerfType(cl::list &PerfTraceFilenames); /// Parse a single line of a PERF_RECORD_MMAP2 event looking for a /// mapping between the binary name and its memory layout. 
/// @@ -626,8 +631,6 @@ void parseAndAggregateTrace(StringRef Filename); // Parse either an MMAP event or a perf sample void parseEventOrSample(TraceStream &TraceIt); - // Parse the hybrid sample including the call and LBR line - void parseHybridSample(TraceStream &TraceIt); // Extract call stack from the perf trace lines bool extractCallstack(TraceStream &TraceIt, SmallVectorImpl &CallStack); @@ -635,13 +638,12 @@ bool extractLBRStack(TraceStream &TraceIt, SmallVectorImpl &LBRStack, ProfiledBinary *Binary); - void checkAndSetPerfType(cl::list &PerfTraceFilenames); + // Parse one sample from multiple perf lines; override this for different + // sample types + virtual void parseSample(TraceStream &TraceIt) = 0; // Post process the profile after trace aggregation, we will do simple range // overlap computation for AutoFDO, or unwind for CSSPGO(hybrid sample). - void generateRawProfile(); - // Unwind the hybrid samples after aggregration - void unwindSamples(); - void printUnwinderOutput(); + virtual void generateRawProfile() = 0; // Helper function for looking up binary in AddressBinaryMap ProfiledBinary *getBinary(uint64_t Address); @@ -654,6 +656,31 @@ PerfScriptType PerfType = PERF_UNKNOWN; }; +/* + Hybrid perf script includes a group of hybrid samples (LBRs + call stack), + which are used to generate a CS profile. An example of a hybrid sample: + 4005dc # call stack leaf + 400634 + 400684 # call stack root + 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ... + ...
0x4005c8/0x4005dc/P/-/-/0 # LBR Entries +*/ +class HybridPerfReader : public PerfReaderBase { +public: + HybridPerfReader(cl::list &BinaryFilenames) + : PerfReaderBase(BinaryFilenames) { + PerfType = PERF_LBR_STACK; + }; + // Parse the hybrid sample including the call and LBR line + void parseSample(TraceStream &TraceIt) override; + void generateRawProfile() override; + +private: + // Unwind the hybrid samples after aggregation + void unwindSamples(); + void printUnwinderOutput(); +}; + } // end namespace sampleprof } // end namespace llvm diff --git a/llvm/tools/llvm-profgen/PerfReader.cpp b/llvm/tools/llvm-profgen/PerfReader.cpp --- a/llvm/tools/llvm-profgen/PerfReader.cpp +++ b/llvm/tools/llvm-profgen/PerfReader.cpp @@ -241,7 +241,7 @@ return true; } -void PerfReader::validateCommandLine( +void PerfReaderBase::validateCommandLine( cl::list &BinaryFilenames, cl::list &PerfTraceFilenames) { // Allow the invalid perfscript if we only use to show binary disassembly @@ -276,16 +276,39 @@ } } -PerfReader::PerfReader(cl::list &BinaryFilenames, +std::unique_ptr +PerfReaderBase::create(cl::list &BinaryFilenames, cl::list &PerfTraceFilenames) { validateCommandLine(BinaryFilenames, PerfTraceFilenames); + + PerfScriptType PerfType = extractPerfType(PerfTraceFilenames); + std::unique_ptr PerfReader; + if (PerfType == PERF_LBR_STACK) { + PerfReader.reset(new HybridPerfReader(BinaryFilenames)); + } else if (PerfType == PERF_LBR) { + // TODO: support LBR-only perf script (PERF_LBR). + exitWithError("Unsupported perfscript!"); + } else { + exitWithError("Unsupported perfscript!"); + } + + return PerfReader; +} + +PerfReaderBase::PerfReaderBase(cl::list &BinaryFilenames) { // Load the binaries. 
for (auto Filename : BinaryFilenames) loadBinary(Filename, /*AllowNameConflict*/ false); } -ProfiledBinary &PerfReader::loadBinary(const StringRef BinaryPath, - bool AllowNameConflict) { +void PerfReaderBase::loadBinaries(cl::list &BinaryFilenames) { + for (auto BinaryPath : BinaryFilenames) { + (void)ProfiledBinary(BinaryPath); + } +} + +ProfiledBinary &PerfReaderBase::loadBinary(const StringRef BinaryPath, + bool AllowNameConflict) { // The binary table is currently indexed by the binary name not the full // binary path. This is because the user-given path may not match the one // that was actually executed. @@ -303,7 +326,7 @@ return Ret.first->second; } -void PerfReader::updateBinaryAddress(const MMapEvent &Event) { +void PerfReaderBase::updateBinaryAddress(const MMapEvent &Event) { // Load the binary. StringRef BinaryPath = Event.BinaryPath; StringRef BinaryName = llvm::sys::path::filename(BinaryPath); @@ -353,7 +376,7 @@ } } -ProfiledBinary *PerfReader::getBinary(uint64_t Address) { +ProfiledBinary *PerfReaderBase::getBinary(uint64_t Address) { auto Iter = AddrToBinaryMap.lower_bound(Address); if (Iter == AddrToBinaryMap.end() || Iter->first != Address) { if (Iter == AddrToBinaryMap.begin()) @@ -415,7 +438,7 @@ printSampleCounter(OrderedCounter); } -void PerfReader::printUnwinderOutput() { +void HybridPerfReader::printUnwinderOutput() { for (auto I : BinarySampleCounters) { const ProfiledBinary *Binary = I.first; outs() << "Binary(" << Binary->getName().str() << ")'s Range Counter:\n"; @@ -425,7 +448,7 @@ } } -void PerfReader::unwindSamples() { +void HybridPerfReader::unwindSamples() { for (const auto &Item : AggregatedSamples) { const HybridSample *Sample = dyn_cast(Item.first.getPtr()); VirtualUnwinder Unwinder(&BinarySampleCounters[Sample->Binary], @@ -437,9 +460,9 @@ printUnwinderOutput(); } -bool PerfReader::extractLBRStack(TraceStream &TraceIt, - SmallVectorImpl &LBRStack, - ProfiledBinary *Binary) { +bool PerfReaderBase::extractLBRStack(TraceStream 
&TraceIt, + SmallVectorImpl &LBRStack, + ProfiledBinary *Binary) { // The raw format of LBR stack is like: // 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ... // ... 0x4005c8/0x4005dc/P/-/-/0 @@ -531,8 +554,8 @@ return !LBRStack.empty(); } -bool PerfReader::extractCallstack(TraceStream &TraceIt, - SmallVectorImpl &CallStack) { +bool PerfReaderBase::extractCallstack(TraceStream &TraceIt, + SmallVectorImpl &CallStack) { // The raw format of call stack is like: // 4005dc # leaf frame // 400634 @@ -593,7 +616,7 @@ !Binary->addressInPrologEpilog(CallStack.front()); } -void PerfReader::parseHybridSample(TraceStream &TraceIt) { +void HybridPerfReader::parseSample(TraceStream &TraceIt) { // The raw hybird sample started with call stack in FILO order and followed // intermediately by LBR sample // e.g. @@ -631,7 +654,7 @@ } } -void PerfReader::parseMMap2Event(TraceStream &TraceIt) { +void PerfReaderBase::parseMMap2Event(TraceStream &TraceIt) { // Parse a line like: // PERF_RECORD_MMAP2 2113428/2113428: [0x7fd4efb57000(0x204000) @ 0 // 08:04 19532229 3585508847]: r-xp /usr/lib64/libdl-2.17.so @@ -677,26 +700,23 @@ TraceIt.advance(); } -void PerfReader::parseEventOrSample(TraceStream &TraceIt) { +void PerfReaderBase::parseEventOrSample(TraceStream &TraceIt) { if (TraceIt.getCurrentLine().startswith("PERF_RECORD_MMAP2")) parseMMap2Event(TraceIt); - else if (getPerfScriptType() == PERF_LBR_STACK) - parseHybridSample(TraceIt); - else { - // TODO: parse other type sample - TraceIt.advance(); - } + else + parseSample(TraceIt); } -void PerfReader::parseAndAggregateTrace(StringRef Filename) { +void PerfReaderBase::parseAndAggregateTrace(StringRef Filename) { // Trace line iterator TraceStream TraceIt(Filename); while (!TraceIt.isAtEoF()) parseEventOrSample(TraceIt); } -void PerfReader::checkAndSetPerfType( - cl::list &PerfTraceFilenames) { +PerfScriptType +PerfReaderBase::extractPerfType(cl::list &PerfTraceFilenames) { + PerfScriptType PerfType = PERF_UNKNOWN; for (auto 
FileName : PerfTraceFilenames) { PerfScriptType Type = checkPerfScriptType(FileName); if (Type == PERF_INVALID) @@ -705,20 +725,13 @@ exitWithError("Inconsistent sample among different perf scripts"); PerfType = Type; } + return PerfType; } -void PerfReader::generateRawProfile() { - if (getPerfScriptType() == PERF_LBR_STACK) { - // Unwind samples if it's hybird sample - unwindSamples(); - } else if (getPerfScriptType() == PERF_LBR) { - // TODO: range overlap computation for regular AutoFDO - } -} +void HybridPerfReader::generateRawProfile() { unwindSamples(); } -void PerfReader::parsePerfTraces(cl::list &PerfTraceFilenames) { - // Check and set current perfscript type - checkAndSetPerfType(PerfTraceFilenames); +void PerfReaderBase::parsePerfTraces( + cl::list &PerfTraceFilenames) { // Parse perf traces and do aggregation. for (auto Filename : PerfTraceFilenames) parseAndAggregateTrace(Filename); diff --git a/llvm/tools/llvm-profgen/ProfiledBinary.h b/llvm/tools/llvm-profgen/ProfiledBinary.h --- a/llvm/tools/llvm-profgen/ProfiledBinary.h +++ b/llvm/tools/llvm-profgen/ProfiledBinary.h @@ -27,6 +27,7 @@ #include "llvm/MC/MCTargetOptions.h" #include "llvm/Object/ELFObjectFile.h" #include "llvm/ProfileData/SampleProf.h" +#include "llvm/Support/CommandLine.h" #include "llvm/Support/Path.h" #include #include @@ -190,7 +191,7 @@ StringRef getName() const { return llvm::sys::path::filename(Path); } uint64_t getBaseAddress() const { return BaseAddress; } void setBaseAddress(uint64_t Address) { BaseAddress = Address; } - + // Return the preferred load address for the first executable segment. uint64_t getPreferredBaseAddress() const { return PreferredTextSegmentAddresses[0]; } // Return the file offset for the first executable segment. 
diff --git a/llvm/tools/llvm-profgen/llvm-profgen.cpp b/llvm/tools/llvm-profgen/llvm-profgen.cpp --- a/llvm/tools/llvm-profgen/llvm-profgen.cpp +++ b/llvm/tools/llvm-profgen/llvm-profgen.cpp @@ -49,14 +49,18 @@ cl::HideUnrelatedOptions({&ProfGenCategory, &getColorCategory()}); cl::ParseCommandLineOptions(argc, argv, "llvm SPGO profile generator\n"); - // Load binaries and parse perf events and samples - PerfReader Reader(BinaryFilenames, PerfTraceFilenames); - if (ShowDisassemblyOnly) + if (ShowDisassemblyOnly) { + PerfReaderBase::loadBinaries(BinaryFilenames); return EXIT_SUCCESS; - Reader.parsePerfTraces(PerfTraceFilenames); + } + + // Load binaries and parse perf events and samples + std::unique_ptr Reader = + PerfReaderBase::create(BinaryFilenames, PerfTraceFilenames); + Reader->parsePerfTraces(PerfTraceFilenames); std::unique_ptr Generator = ProfileGenerator::create( - Reader.getBinarySampleCounters(), Reader.getPerfScriptType()); + Reader->getBinarySampleCounters(), Reader->getPerfScriptType()); Generator->generateProfile(); Generator->write();