diff --git a/llvm/test/tools/llvm-profgen/cs-invalid-ret-addr.test b/llvm/test/tools/llvm-profgen/cs-invalid-ret-addr.test --- a/llvm/test/tools/llvm-profgen/cs-invalid-ret-addr.test +++ b/llvm/test/tools/llvm-profgen/cs-invalid-ret-addr.test @@ -1,4 +1,4 @@ ; REQUIRES: x86_64-linux -; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/cs-invalid-ret-addr.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t 2>&1 | FileCheck %s +; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/cs-invalid-ret-addr.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --show-detailed-warning 2>&1 | FileCheck %s ; CHECK: warning: Truncated stack sample due to invalid return address at 0x400686, likely caused by frame pointer omission diff --git a/llvm/tools/llvm-profgen/PerfReader.h b/llvm/tools/llvm-profgen/PerfReader.h --- a/llvm/tools/llvm-profgen/PerfReader.h +++ b/llvm/tools/llvm-profgen/PerfReader.h @@ -581,10 +581,13 @@ void parseAndAggregateTrace(); // Parse either an MMAP event or a perf sample void parseEventOrSample(TraceStream &TraceIt); + void emitWarningSummary(uint64_t Num, uint64_t Total, StringRef Msg); // Warn if the relevant mmap event is missing. void warnIfMissingMMap(); // Emit accumulate warnings. void warnTruncatedStack(); + // Warn if range is invalid. + void warnInvalidRange(); // Extract call stack from the perf trace lines bool extractCallstack(TraceStream &TraceIt, SmallVectorImpl &CallStack); diff --git a/llvm/tools/llvm-profgen/PerfReader.cpp b/llvm/tools/llvm-profgen/PerfReader.cpp --- a/llvm/tools/llvm-profgen/PerfReader.cpp +++ b/llvm/tools/llvm-profgen/PerfReader.cpp @@ -31,6 +31,10 @@ IgnoreStackSamples("ignore-stack-samples", cl::init(false), cl::ZeroOrMore, cl::desc("Ignore call stack samples for hybrid samples " "and produce context-insensitive profile.")); +static cl::opt + ShowDetailedWarning("show-detailed-warning", cl::init(false), + cl::ZeroOrMore, + cl::desc("Show detailed warning message.")); extern cl::opt PerfTraceFilename; extern cl::opt ShowDisassemblyOnly; @@ -433,10 +437,16 @@ } // Warn about untracked frames due to missing probes. - for (auto Address : AllUntrackedCallsites) - WithColor::warning() << "Profile context truncated due to missing probe " - << "for call instruction at " - << format("0x%" PRIx64, Address) << "\n"; + if (ShowDetailedWarning) { + for (auto Address : AllUntrackedCallsites) + WithColor::warning() << "Profile context truncated due to missing probe " + << "for call instruction at " + << format("0x%" PRIx64, Address) << "\n"; + } + + emitWarningSummary( + AllUntrackedCallsites.size(), SampleCounters.size(), + "Profile context truncated due to missing probe for call instruction."); } bool PerfScriptReader::extractLBRStack(TraceStream &TraceIt, @@ -1008,12 +1018,100 @@ } void PerfScriptReader::warnTruncatedStack() { - for (auto Address : InvalidReturnAddresses) { - WithColor::warning() - << "Truncated stack sample due to invalid return address at " - << format("0x%" PRIx64, Address) - << ", likely caused by frame pointer omission\n"; + if (ShowDetailedWarning) { + for (auto Address : InvalidReturnAddresses) { + WithColor::warning() + << "Truncated stack sample due to invalid return address at " + << format("0x%" PRIx64, Address) + << ", likely caused by frame pointer omission\n"; + } + } + emitWarningSummary(InvalidReturnAddresses.size(), AggregatedSamples.size(), + "Truncated stack sample due to invalid return address, " + "likely caused by frame pointer omission."); +} + +void PerfScriptReader::emitWarningSummary(uint64_t Num, uint64_t Total, + StringRef Msg) { + if (!Total || !Num) + return; + WithColor::warning() << format("%.2f", static_cast(Num) * 100 / Total) + << "%(" << Num << "/" << Total + << ") cases with issue: " << Msg << "\n"; +} + +void PerfScriptReader::warnInvalidRange() { + std::unordered_map, uint64_t, + pair_hash> + Ranges; + + for (const auto &Item : AggregatedSamples) { + const PerfSample *Sample = Item.first.getPtr(); + uint64_t Count = Item.second; + uint64_t EndOffeset = 0; + for (const LBREntry &LBR : Sample->LBRStack) { + uint64_t SourceOffset = Binary->virtualAddrToOffset(LBR.Source); + uint64_t StartOffset = Binary->virtualAddrToOffset(LBR.Target); + if (EndOffeset != 0) + Ranges[{StartOffset, EndOffeset}] += Count; + EndOffeset = SourceOffset; + } } + + if (Ranges.empty()) { + WithColor::warning() << "No samples in perf script!\n"; + return; + } + + auto WarnInvalidRange = + [&](uint64_t StartOffset, uint64_t EndOffset, StringRef Msg) { + if (!ShowDetailedWarning) + return; + WithColor::warning() + << "[" + << format("%8" PRIx64, Binary->offsetToVirtualAddr(StartOffset)) + << "," + << format("%8" PRIx64, Binary->offsetToVirtualAddr(EndOffset)) + << "]: " << Msg << "\n"; + }; + + static const char *EndNotBoundaryMsg = + "Range end is not on instruction boundary."; + static const char *DanglingRangeMsg = + "Range does not belong to any functions, likely from external function."; + static const char *RangeCrossFuncMsg = + "Fall through range should not cross function boundaries."; + + uint64_t EndNotBoundary = 0; + uint64_t DanglingRange = 0; + uint64_t RangeCrossFunc = 0; + + for (auto &I : Ranges) { + uint64_t StartOffset = I.first.first; + uint64_t EndOffset = I.first.second; + + if (!Binary->offsetIsBoundry(EndOffset)) { + EndNotBoundary++; + WarnInvalidRange(StartOffset, EndOffset, EndNotBoundaryMsg); + } + + auto *FRange = Binary->findFuncRangeForOffset(StartOffset); + if (!FRange) { + DanglingRange++; + WarnInvalidRange(StartOffset, EndOffset, DanglingRangeMsg); + continue; + } + + if (EndOffset >= FRange->EndOffset) { + RangeCrossFunc++; + WarnInvalidRange(StartOffset, EndOffset, RangeCrossFuncMsg); + } + } + + uint64_t TotalRangeNum = Ranges.size(); + emitWarningSummary(EndNotBoundary, TotalRangeNum, EndNotBoundaryMsg); + emitWarningSummary(DanglingRange, TotalRangeNum, DanglingRangeMsg); + emitWarningSummary(RangeCrossFunc, TotalRangeNum, RangeCrossFuncMsg); } void PerfScriptReader::parsePerfTraces() { @@ -1022,6 +1120,7 @@ // Generate unsymbolized profile. warnTruncatedStack(); + warnInvalidRange(); generateUnsymbolizedProfile(); if (SkipSymbolization) diff --git a/llvm/tools/llvm-profgen/ProfiledBinary.h b/llvm/tools/llvm-profgen/ProfiledBinary.h --- a/llvm/tools/llvm-profgen/ProfiledBinary.h +++ b/llvm/tools/llvm-profgen/ProfiledBinary.h @@ -207,6 +207,8 @@ std::unordered_set CallAddrs; // A set of return instruction offsets. Used by virtual unwinding. std::unordered_set RetAddrs; + // A set of terminator(branch or return instruction) offsets. + std::unordered_set TerminatorOffsets; // Estimate and track function prolog and epilog ranges. PrologEpilogTracker ProEpilogTracker; @@ -322,6 +324,10 @@ return ProEpilogTracker.PrologEpilogSet.count(Offset); } + bool offsetIsBoundry(uint64_t Offset) { + return TerminatorOffsets.count(Offset) || CallAddrs.count(Offset); + } + uint64_t getAddressforIndex(uint64_t Index) const { return offsetToVirtualAddr(CodeAddrOffsets[Index]); } diff --git a/llvm/tools/llvm-profgen/ProfiledBinary.cpp b/llvm/tools/llvm-profgen/ProfiledBinary.cpp --- a/llvm/tools/llvm-profgen/ProfiledBinary.cpp +++ b/llvm/tools/llvm-profgen/ProfiledBinary.cpp @@ -401,6 +401,9 @@ else if (MCDesc.isReturn()) RetAddrs.insert(Offset); + if (MCDesc.isTerminator()) + TerminatorOffsets.insert(Offset); + if (InvalidInstLength) { WarnInvalidInsts(Offset - InvalidInstLength, Offset - 1); InvalidInstLength = 0;