Diff 375664

llvm/test/tools/llvm-profgen/inline-cs-noprobe.test

	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/inline-cs-noprobe.perfscript --binary=%S/Inputs/inline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/inline-cs-noprobe.perfscript --binary=%S/Inputs/inline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-UNWINDER			; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-UNWINDER
	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/inline-cs-noprobe.perfscript --binary=%S/Inputs/inline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/inline-cs-noprobe.perfscript --binary=%S/Inputs/inline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t			; RUN: FileCheck %s --input-file %t
				; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/inline-cs-noprobe.perfscript --binary=%S/Inputs/inline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0 --ignore-stack-samples
				; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-STRIP-CTX

	; CHECK:[main:1 @ foo]:309:0			; CHECK:[main:1 @ foo]:309:0
	; CHECK: 2.1: 14			; CHECK: 2.1: 14
	; CHECK: 3: 15			; CHECK: 3: 15
	; CHECK: 3.1: 14 bar:14			; CHECK: 3.1: 14 bar:14
	; CHECK: 3.2: 1			; CHECK: 3.2: 1
	; CHECK:[main:1 @ foo:3.1 @ bar]:84:0			; CHECK:[main:1 @ foo:3.1 @ bar]:84:0
	; CHECK: 1: 14			; CHECK: 1: 14

				; CHECK-STRIP-CTX: main:379:0
				; CHECK-STRIP-CTX: 0: 0
				; CHECK-STRIP-CTX: 2: 0
				; CHECK-STRIP-CTX: 1: foo:379
				; CHECK-STRIP-CTX: 2.1: 14
				; CHECK-STRIP-CTX: 3: 15
				; CHECK-STRIP-CTX: 3.2: 1
				; CHECK-STRIP-CTX: 4: 0
				; CHECK-STRIP-CTX: 7: 0
				; CHECK-STRIP-CTX: 3.1: bar:84
				; CHECK-STRIP-CTX: 1: 14

	; CHECK-UNWINDER: [main:1 @ foo]			; CHECK-UNWINDER: [main:1 @ foo]
	; CHECK-UNWINDER: 4			; CHECK-UNWINDER: 4
	; CHECK-UNWINDER: 670-6ad:1			; CHECK-UNWINDER: 670-6ad:1
	; CHECK-UNWINDER: 67e-69b:1			; CHECK-UNWINDER: 67e-69b:1
	; CHECK-UNWINDER: 67e-6ad:13			; CHECK-UNWINDER: 67e-6ad:13
	; CHECK-UNWINDER: 6bd-6c8:14			; CHECK-UNWINDER: 6bd-6c8:14
	; CHECK-UNWINDER: 2			; CHECK-UNWINDER: 2
	; CHECK-UNWINDER: 69b->670:1			; CHECK-UNWINDER: 69b->670:1
	Show All 28 Lines

llvm/test/tools/llvm-profgen/noinline-cs-noprobe.test

	;; The test fails on Windows. Fix it before removing the following requirement.			;; The test fails on Windows. Fix it before removing the following requirement.
	; REQUIRES: x86_64-linux			; REQUIRES: x86_64-linux
	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-UNWINDER			; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-UNWINDER
	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t			; RUN: FileCheck %s --input-file %t
				; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0 --ignore-stack-samples
				; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-STRIP-CTX
	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.aggperfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.aggperfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --skip-symbolization --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-AGG-UNWINDER			; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-AGG-UNWINDER
	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.aggperfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.aggperfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t --profile-summary-cold-count=0
	; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-AGG			; RUN: FileCheck %s --input-file %t --check-prefix=CHECK-AGG

	; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t1 --profile-summary-cold-count=0			; RUN: llvm-profgen --format=text --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t1 --profile-summary-cold-count=0
	; RUN: llvm-profgen --format=extbinary --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t2 --profile-summary-cold-count=0 -use-md5			; RUN: llvm-profgen --format=extbinary --perfscript=%S/Inputs/noinline-cs-noprobe.perfscript --binary=%S/Inputs/noinline-cs-noprobe.perfbin --output=%t2 --profile-summary-cold-count=0 -use-md5
	; RUN: llvm-profdata show --sample -show-sec-info-only %t2 \| FileCheck %s --check-prefix=CHECK-MD5			; RUN: llvm-profdata show --sample -show-sec-info-only %t2 \| FileCheck %s --check-prefix=CHECK-MD5
	Show All 38 Lines
	; CHECK: 3: 3 bar:3			; CHECK: 3: 3 bar:3
	; CHECK:[main:1 @ foo:3 @ bar]:50:3			; CHECK:[main:1 @ foo:3 @ bar]:50:3
	; CHECK: 0: 3			; CHECK: 0: 3
	; CHECK: 1: 3			; CHECK: 1: 3
	; CHECK: 2: 2			; CHECK: 2: 2
	; CHECK: 4: 1			; CHECK: 4: 1
	; CHECK: 5: 3			; CHECK: 5: 3

				; CHECK-STRIP-CTX: foo:57:0
				; CHECK-STRIP-CTX: 0: 0
				; CHECK-STRIP-CTX: 1: 0
				; CHECK-STRIP-CTX: 2: 3
				; CHECK-STRIP-CTX: 3: 3 bar:3
				; CHECK-STRIP-CTX: 4: 0
				; CHECK-STRIP-CTX: 5: 0
				; CHECK-STRIP-CTX: bar:50:3
				; CHECK-STRIP-CTX: 0: 3
				; CHECK-STRIP-CTX: 1: 3
				; CHECK-STRIP-CTX: 2: 2
				; CHECK-STRIP-CTX: 4: 1
				; CHECK-STRIP-CTX: 5: 3

	; CHECK-UNWINDER: [main:1 @ foo]			; CHECK-UNWINDER: [main:1 @ foo]
	; CHECK-UNWINDER-NEXT: 3			; CHECK-UNWINDER-NEXT: 3
	; CHECK-UNWINDER-NEXT: 5ff-62f:3			; CHECK-UNWINDER-NEXT: 5ff-62f:3
	; CHECK-UNWINDER-NEXT: 634-637:3			; CHECK-UNWINDER-NEXT: 634-637:3
	; CHECK-UNWINDER-NEXT: 645-645:3			; CHECK-UNWINDER-NEXT: 645-645:3
	; CHECK-UNWINDER-NEXT: 3			; CHECK-UNWINDER-NEXT: 3
	; CHECK-UNWINDER-NEXT: 62f->5b0:3			; CHECK-UNWINDER-NEXT: 62f->5b0:3
	▲ Show 20 Lines • Show All 41 Lines • Show Last 20 Lines

llvm/tools/llvm-profgen/PerfReader.h

Show First 20 Lines • Show All 568 Lines • ▼ Show 20 Lines	struct MMapEvent {
uint64_t PID = 0;		uint64_t PID = 0;
uint64_t Address = 0;		uint64_t Address = 0;
uint64_t Size = 0;		uint64_t Size = 0;
uint64_t Offset = 0;		uint64_t Offset = 0;
StringRef BinaryPath;		StringRef BinaryPath;
};		};

void updateBinaryAddress(const MMapEvent &Event);		void updateBinaryAddress(const MMapEvent &Event);
PerfScriptType getPerfScriptType() const { return PerfType; }
// Entry of the reader to parse multiple perf traces		// Entry of the reader to parse multiple perf traces
void parsePerfTraces(cl::list<std::string> &PerfTraceFilenames);		void parsePerfTraces(cl::list<std::string> &PerfTraceFilenames);
const ContextSampleCounterMap &getSampleCounters() const {		const ContextSampleCounterMap &getSampleCounters() const {
return SampleCounters;		return SampleCounters;
}		}
		bool profileIsCS() { return ProfileIsCS; }

protected:		protected:
static PerfScriptType		static PerfScriptType
extractPerfType(cl::list<std::string> &PerfTraceFilenames);		extractPerfType(cl::list<std::string> &PerfTraceFilenames);
/// Parse a single line of a PERF_RECORD_MMAP2 event looking for a		/// Parse a single line of a PERF_RECORD_MMAP2 event looking for a
/// mapping between the binary name and its memory layout.		/// mapping between the binary name and its memory layout.
///		///
void parseMMap2Event(TraceStream &TraceIt);		void parseMMap2Event(TraceStream &TraceIt);
Show All 15 Lines	protected:
// Parse one sample from multiple perf lines, override this for different		// Parse one sample from multiple perf lines, override this for different
// sample type		// sample type
void parseSample(TraceStream &TraceIt);		void parseSample(TraceStream &TraceIt);
// An aggregated count is given to indicate how many times the sample is		// An aggregated count is given to indicate how many times the sample is
// repeated.		// repeated.
virtual void parseSample(TraceStream &TraceIt, uint64_t Count) = 0;		virtual void parseSample(TraceStream &TraceIt, uint64_t Count) = 0;
// Post process the profile after trace aggregation, we will do simple range		// Post process the profile after trace aggregation, we will do simple range
// overlap computation for AutoFDO, or unwind for CSSPGO(hybrid sample).		// overlap computation for AutoFDO, or unwind for CSSPGO(hybrid sample).
virtual void generateRawProfile() = 0;		virtual void generateRawProfile() = 0;
		wenleiUnsubmitted Not Done Reply Inline Actions This is now defined both in LBRPerfReader and PerfReaderBase? Is that intended? And it's not virtual, and yet declared as protected.. wenlei: This is now defined both in LBRPerfReader and PerfReaderBase? Is that intended? And it's not…
		wleiAuthorUnsubmitted Done Reply Inline Actions removed wlei: removed
void writeRawProfile(StringRef Filename);		void writeRawProfile(StringRef Filename);
void writeRawProfile(raw_fd_ostream &OS);		void writeRawProfile(raw_fd_ostream &OS);

ProfiledBinary *Binary = nullptr;		ProfiledBinary *Binary = nullptr;

ContextSampleCounterMap SampleCounters;		ContextSampleCounterMap SampleCounters;
// Samples with the repeating time generated by the perf reader		// Samples with the repeating time generated by the perf reader
AggregatedCounter AggregatedSamples;		AggregatedCounter AggregatedSamples;
PerfScriptType PerfType = PERF_UNKNOWN;		PerfScriptType PerfType = PERF_UNKNOWN;
// Keep track of all invalid return addresses		// Keep track of all invalid return addresses
std::set<uint64_t> InvalidReturnAddresses;		std::set<uint64_t> InvalidReturnAddresses;

		bool ProfileIsCS = false;
		};

		/*
		The reader of LBR only perf script.
		A typical LBR sample is like:
		40062f 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...
		... 0x4005c8/0x4005dc/P/-/-/0
		*/
		class LBRPerfReader : public PerfReaderBase {
		public:
		LBRPerfReader(ProfiledBinary *Binary) : PerfReaderBase(Binary) {
		PerfType = PERF_LBR;
		};
		// Parse the LBR only sample.
		virtual void parseSample(TraceStream &TraceIt, uint64_t Count) override;
		virtual void generateRawProfile() override;

		private:
		void computeCounterFromLBR(const PerfSample *Sample, uint64_t Repeat);
		wenleiUnsubmitted Not Done Reply Inline Actions Can this be private just like before? wenlei: Can this be private just like before?
};		};

/*		/*
Hybrid perf script includes a group of hybrid samples(LBRs + call stack),		Hybrid perf script includes a group of hybrid samples(LBRs + call stack),
which is used to generate CS profile. An example of hybrid sample:		which is used to generate CS profile. An example of hybrid sample:
4005dc # call stack leaf		4005dc # call stack leaf
400634		400634
400684 # call stack root		400684 # call stack root
0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...		0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...
... 0x4005c8/0x4005dc/P/-/-/0 # LBR Entries		... 0x4005c8/0x4005dc/P/-/-/0 # LBR Entries
*/		*/
class HybridPerfReader : public PerfReaderBase {		class HybridPerfReader : public LBRPerfReader {
public:		public:
HybridPerfReader(ProfiledBinary *Binary) : PerfReaderBase(Binary) {		HybridPerfReader(ProfiledBinary *Binary) : LBRPerfReader(Binary) {
PerfType = PERF_LBR_STACK;		PerfType = PERF_LBR_STACK;
};		};
// Parse the hybrid sample including the call and LBR line		// Parse the hybrid sample including the call and LBR line
void parseSample(TraceStream &TraceIt, uint64_t Count) override;		void parseSample(TraceStream &TraceIt, uint64_t Count) override;
void generateRawProfile() override;		void generateRawProfile() override;

private:		private:
// Unwind the hybrid samples after aggregation		// Unwind the hybrid samples after aggregation
void unwindSamples();		void unwindSamples();
};		};

/*
The reader of LBR only perf script.
A typical LBR sample is like:
40062f 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...
... 0x4005c8/0x4005dc/P/-/-/0
*/
class LBRPerfReader : public PerfReaderBase {
public:
LBRPerfReader(ProfiledBinary *Binary) : PerfReaderBase(Binary) {
// There is no context for LBR only sample, so initialize one entry with
// fake "empty" context key.
std::shared_ptr<StringBasedCtxKey> Key =
std::make_shared<StringBasedCtxKey>();
Key->genHashCode();
SampleCounters.emplace(Hashable<ContextKey>(Key), SampleCounter());
PerfType = PERF_LBR;
};

// Parse the LBR only sample.
void parseSample(TraceStream &TraceIt, uint64_t Count) override;
void generateRawProfile() override;

private:
void computeCounterFromLBR(const PerfSample *Sample, uint64_t Repeat);
};

} // end namespace sampleprof		} // end namespace sampleprof
} // end namespace llvm		} // end namespace llvm

#endif		#endif

llvm/tools/llvm-profgen/PerfReader.cpp

Show All 16 Lines

cl::opt<bool> SkipSymbolization("skip-symbolization", cl::ReallyHidden,		cl::opt<bool> SkipSymbolization("skip-symbolization", cl::ReallyHidden,
cl::init(false), cl::ZeroOrMore,		cl::init(false), cl::ZeroOrMore,
cl::desc("Dump the unsymbolized profile to the "		cl::desc("Dump the unsymbolized profile to the "
"output file. It will show unwinder "		"output file. It will show unwinder "
"output for CS profile generation."));		"output for CS profile generation."));
cl::opt<bool> UseOffset("use-offset", cl::ReallyHidden, cl::init(true),		cl::opt<bool> UseOffset("use-offset", cl::ReallyHidden, cl::init(true),
cl::ZeroOrMore,		cl::ZeroOrMore,
cl::desc("Work with `--skip-symbolization` to dump the "		cl::desc("Work with `--skip-symbolization` to dump the "
		wenleiUnsubmitted Not Done Reply Inline Actions Use `ignore-stack-samples`? wenlei: Use `ignore-stack-samples`?
		wleiAuthorUnsubmitted Done Reply Inline Actions Sounds good! wlei: Sounds good!
"offset instead of virtual address."));		"offset instead of virtual address."));
		hoyUnsubmitted Not Done Reply Inline Actions nit: sample -> samples hoy: nit: sample -> samples
		wleiAuthorUnsubmitted Done Reply Inline Actions fixed! wlei: fixed!
		cl::opt<bool>
		IgnoreStackSamples("ignore-stack-samples", cl::ReallyHidden,
		cl::init(false), cl::ZeroOrMore,
		cl::desc("Ignore call stack samples for hybrid samples "
		"and produce context-insensitive profile."));

extern cl::opt<bool> ShowDisassemblyOnly;		extern cl::opt<bool> ShowDisassemblyOnly;
extern cl::opt<bool> ShowSourceLocations;		extern cl::opt<bool> ShowSourceLocations;
extern cl::opt<std::string> OutputFilename;		extern cl::opt<std::string> OutputFilename;

namespace llvm {		namespace llvm {
namespace sampleprof {		namespace sampleprof {

▲ Show 20 Lines • Show All 325 Lines • ▼ Show 20 Lines	AllUntrackedCallsites.insert(CurrUntrackedCallsites.begin(),
CurrUntrackedCallsites.end());		CurrUntrackedCallsites.end());
}		}

// Warn about untracked frames due to missing probes.		// Warn about untracked frames due to missing probes.
for (auto Address : AllUntrackedCallsites)		for (auto Address : AllUntrackedCallsites)
WithColor::warning() << "Profile context truncated due to missing probe "		WithColor::warning() << "Profile context truncated due to missing probe "
<< "for call instruction at "		<< "for call instruction at "
<< format("%" PRIx64, Address) << "\n";		<< format("%" PRIx64, Address) << "\n";

if (SkipSymbolization)
writeRawProfile(OutputFilename);
}		}

bool PerfReaderBase::extractLBRStack(TraceStream &TraceIt,		bool PerfReaderBase::extractLBRStack(TraceStream &TraceIt,
SmallVectorImpl<LBREntry> &LBRStack) {		SmallVectorImpl<LBREntry> &LBRStack) {
// The raw format of LBR stack is like:		// The raw format of LBR stack is like:
// 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...		// 0x4005c8/0x4005dc/P/-/-/0 0x40062f/0x4005b0/P/-/-/0 ...
// ... 0x4005c8/0x4005dc/P/-/-/0		// ... 0x4005c8/0x4005dc/P/-/-/0
// It's in FIFO order and separated by whitespace.		// It's in FIFO order and separated by whitespace.
▲ Show 20 Lines • Show All 291 Lines • ▼ Show 20 Lines	void LBRPerfReader::parseSample(TraceStream &TraceIt, uint64_t Count) {
if (extractLBRStack(TraceIt, Sample->LBRStack)) {		if (extractLBRStack(TraceIt, Sample->LBRStack)) {
warnIfMissingMMap();		warnIfMissingMMap();
// Record LBR only samples by aggregation		// Record LBR only samples by aggregation
AggregatedSamples[Hashable<PerfSample>(Sample)] += Count;		AggregatedSamples[Hashable<PerfSample>(Sample)] += Count;
}		}
}		}

void LBRPerfReader::generateRawProfile() {		void LBRPerfReader::generateRawProfile() {
assert(SampleCounters.size() == 1 && "Must have one entry of sample counter");		// There is no context for LBR only sample, so initialize one entry with
		// fake "empty" context key.
		assert(SampleCounters.empty() &&
		"Sample counter map should be empty before raw profile generation");
		std::shared_ptr<StringBasedCtxKey> Key =
		std::make_shared<StringBasedCtxKey>();
		Key->genHashCode();
		SampleCounters.emplace(Hashable<ContextKey>(Key), SampleCounter());
		wenleiUnsubmitted Not Done Reply Inline Actions assert SampleCounters.size is zero then? wenlei: assert SampleCounters.size is zero then?
		wleiAuthorUnsubmitted Done Reply Inline Actions added! wlei: added!
for (const auto &Item : AggregatedSamples) {		for (const auto &Item : AggregatedSamples) {
const PerfSample *Sample = Item.first.getPtr();		const PerfSample *Sample = Item.first.getPtr();
computeCounterFromLBR(Sample, Item.second);		computeCounterFromLBR(Sample, Item.second);
}		}

if (SkipSymbolization)
PerfReaderBase::writeRawProfile(OutputFilename);
}		}

uint64_t PerfReaderBase::parseAggregatedCount(TraceStream &TraceIt) {		uint64_t PerfReaderBase::parseAggregatedCount(TraceStream &TraceIt) {
// The aggregated count is optional, so do not skip the line and return 1 if		// The aggregated count is optional, so do not skip the line and return 1 if
// it's unmatched		// it's unmatched
uint64_t Count = 1;		uint64_t Count = 1;
if (!TraceIt.getCurrentLine().getAsInteger(10, Count))		if (!TraceIt.getCurrentLine().getAsInteger(10, Count))
TraceIt.advance();		TraceIt.advance();
▲ Show 20 Lines • Show All 75 Lines • ▼ Show 20 Lines	if (Type == PERF_INVALID)
exitWithError("Invalid perf script input!");		exitWithError("Invalid perf script input!");
if (PerfType != PERF_UNKNOWN && PerfType != Type)		if (PerfType != PERF_UNKNOWN && PerfType != Type)
exitWithError("Inconsistent sample among different perf scripts");		exitWithError("Inconsistent sample among different perf scripts");
PerfType = Type;		PerfType = Type;
}		}
return PerfType;		return PerfType;
}		}

void HybridPerfReader::generateRawProfile() { unwindSamples(); }		void HybridPerfReader::generateRawProfile() {
		ProfileIsCS = !IgnoreStackSamples;
		wenleiUnsubmitted Not Done Reply Inline Actions nit: make sure we update ProfileIsCS properly for both cases rather than relying on its current value: `ProfileIsCS = !IgnoreStackSamples; if (ProfileIsCS) unwindSamples(); else LBRPerfReader::generateRawProfile();` wenlei: nit: make sure we update ProfileIsCS properly for both cases rather than relying on its current value.
		wleiAuthorUnsubmitted Done Reply Inline Actions Good idea! wlei: Good idea!
		if (ProfileIsCS)
		wenleiUnsubmitted Not Done Reply Inline Actions Where do we check PerfType later? If PerfType is meant to be input type, can we not set it to PERF_LBR since input type which is indeed hybrid? If we meant to use PerfType to indicate "processing mode", perhaps we should then set it to PERF_LBR earlier in extractPerfType, then create LBRPerfReader and teach it to ignore stack samples. That also avoids changing to have HybridPerfReader derive from LBRPerfReader.. Change the type half way seems inconsistent. wenlei: Where do we check PerfType later? If PerfType is meant to be input type, can we not set it to…
		wleiAuthorUnsubmitted Done Reply Inline Actions Agree with you, except I still prefer LBRPerfReader being responsible only for PERF_LBR and HybridPerfReader only for PERF_LBR_STACK; otherwise we need to maintain two parts of the code for the hybrid sample parsing. On second thought, I think we already know whether it's a CS/non-CS [raw] profile in PerfReader, so we can move the `genRawProfiles` logic out of `parsePerfTraces`. In `parsePerfTraces`, we only populate `perfSample`. Then `genRawProfiles`, based on the perf type or `ignore-stack-samples`, can decide to generate a CS raw profile or a non-CS raw profile. With this, we now pass a new flag `ProfileIsCS` to the generator instead of the perf_type. Updated the code here, see if this looks good to you? wlei: Agree with you except I still prefer LBRPerfReader only responsible for PERF_LBR and…
		wenleiUnsubmitted Not Done Reply Inline Actions (quoting wlei) "I still prefer LBRPerfReader only responsible for PERF_LBR and HybridPerfReader only for PERF_LBR_STACK otherwise we need to maintain two part of code for the hybrid sample parsing." Yeah, we don't want to duplicate the code for sure. I'm not sure about the refactoring to move unwind etc. all into the base class though. I feel the unwind and hybrid sample parsing belong to HybridPerfReader; otherwise why do we need a HybridPerfReader? Can we call `LBRPerfReader::generateRawProfile()` here in `HybridPerfReader::generateRawProfile()` just like what you had before, but without setting `PerfType` to `PERF_LBR`? wenlei: > I still prefer LBRPerfReader only responsible for PERF_LBR and HybridPerfReader only for…
		hoyUnsubmitted Not Done Reply Inline Actions (quoting wenlei) "Can we call LBRPerfReader::generateRawProfile() here in HybridPerfReader::generateRawProfile() just like what you had before, but without setting PerfType to PERF_LBR?" This sounds good to me. We still need to parse stack samples even with `IgnoreStackSamples`, but we don't need to unwind them. hoy: > Can we call LBRPerfReader::generateRawProfile() here in HybridPerfReader::generateRawProfile…
		wleiAuthorUnsubmitted Done Reply Inline Actions Sounds good to move the unwinder into `HybridPerfReader`. wlei: Sounds good to move the unwinder into `HybridPerfReader`.
		unwindSamples();
		else
		LBRPerfReader::generateRawProfile();
		}

void PerfReaderBase::warnTruncatedStack() {		void PerfReaderBase::warnTruncatedStack() {
for (auto Address : InvalidReturnAddresses) {		for (auto Address : InvalidReturnAddresses) {
WithColor::warning()		WithColor::warning()
<< "Truncated stack sample due to invalid return address at "		<< "Truncated stack sample due to invalid return address at "
<< format("0x%" PRIx64, Address)		<< format("0x%" PRIx64, Address)
<< ", likely caused by frame pointer omission\n";		<< ", likely caused by frame pointer omission\n";
}		}
}		}

void PerfReaderBase::parsePerfTraces(		void PerfReaderBase::parsePerfTraces(
cl::list<std::string> &PerfTraceFilenames) {		cl::list<std::string> &PerfTraceFilenames) {
// Parse perf traces and do aggregation.		// Parse perf traces and do aggregation.
for (auto Filename : PerfTraceFilenames)		for (auto Filename : PerfTraceFilenames)
parseAndAggregateTrace(Filename);		parseAndAggregateTrace(Filename);

warnTruncatedStack();		warnTruncatedStack();
generateRawProfile();		generateRawProfile();

		if (SkipSymbolization)
		writeRawProfile(OutputFilename);
}		}

} // end namespace sampleprof		} // end namespace sampleprof
} // end namespace llvm		} // end namespace llvm

llvm/tools/llvm-profgen/ProfileGenerator.h

	Show All 28 Lines

	public:			public:
	ProfileGeneratorBase(ProfiledBinary *Binary,			ProfileGeneratorBase(ProfiledBinary *Binary,
	const ContextSampleCounterMap &Counters)			const ContextSampleCounterMap &Counters)
	: Binary(Binary), SampleCounters(Counters){};			: Binary(Binary), SampleCounters(Counters){};
	virtual ~ProfileGeneratorBase() = default;			virtual ~ProfileGeneratorBase() = default;
	static std::unique_ptr<ProfileGeneratorBase>			static std::unique_ptr<ProfileGeneratorBase>
	create(ProfiledBinary *Binary, const ContextSampleCounterMap &SampleCounters,			create(ProfiledBinary *Binary, const ContextSampleCounterMap &SampleCounters,
	enum PerfScriptType SampleType);			bool ProfileIsCS);
	virtual void generateProfile() = 0;			virtual void generateProfile() = 0;
	void write();			void write();

	protected:			protected:
	// Use SampleProfileWriter to serialize profile map			// Use SampleProfileWriter to serialize profile map
	void write(std::unique_ptr<SampleProfileWriter> Writer,			void write(std::unique_ptr<SampleProfileWriter> Writer,
	SampleProfileMap &ProfileMap);			SampleProfileMap &ProfileMap);
	/*			/*
	▲ Show 20 Lines • Show All 234 Lines • Show Last 20 Lines

llvm/tools/llvm-profgen/ProfileGenerator.cpp

	Show First 20 Lines • Show All 71 Lines • ▼ Show 20 Lines
	// Initialize the MaxCompressionSize to -1 which means no size limit			// Initialize the MaxCompressionSize to -1 which means no size limit
	int32_t CSProfileGenerator::MaxCompressionSize = -1;			int32_t CSProfileGenerator::MaxCompressionSize = -1;

	int CSProfileGenerator::MaxContextDepth = -1;			int CSProfileGenerator::MaxContextDepth = -1;

	std::unique_ptr<ProfileGeneratorBase>			std::unique_ptr<ProfileGeneratorBase>
	ProfileGeneratorBase::create(ProfiledBinary *Binary,			ProfileGeneratorBase::create(ProfiledBinary *Binary,
	const ContextSampleCounterMap &SampleCounters,			const ContextSampleCounterMap &SampleCounters,
	enum PerfScriptType SampleType) {			bool ProfileIsCS) {
	std::unique_ptr<ProfileGeneratorBase> Generator;			std::unique_ptr<ProfileGeneratorBase> Generator;
	if (SampleType == PERF_LBR) {			if (ProfileIsCS) {
	// TODO: Support probe based profile generation
	Generator.reset(new ProfileGenerator(Binary, SampleCounters));
	} else if (SampleType == PERF_LBR_STACK) {
	Generator.reset(new CSProfileGenerator(Binary, SampleCounters));			Generator.reset(new CSProfileGenerator(Binary, SampleCounters));
	} else {			} else {
	llvm_unreachable("Unsupported perfscript!");			Generator.reset(new ProfileGenerator(Binary, SampleCounters));
	}			}

	return Generator;			return Generator;
	}			}

	void ProfileGeneratorBase::write(std::unique_ptr<SampleProfileWriter> Writer,			void ProfileGeneratorBase::write(std::unique_ptr<SampleProfileWriter> Writer,
	SampleProfileMap &ProfileMap) {			SampleProfileMap &ProfileMap) {
	if (std::error_code EC = Writer->write(ProfileMap))			if (std::error_code EC = Writer->write(ProfileMap))
	▲ Show 20 Lines • Show All 721 Lines • Show Last 20 Lines

llvm/tools/llvm-profgen/llvm-profgen.cpp

Show First 20 Lines • Show All 83 Lines • ▼ Show 20 Lines	std::unique_ptr<ProfiledBinary> Binary =
std::make_unique<ProfiledBinary>(BinaryPath);		std::make_unique<ProfiledBinary>(BinaryPath);
if (ShowDisassemblyOnly)		if (ShowDisassemblyOnly)
return EXIT_SUCCESS;		return EXIT_SUCCESS;

// Parse perf events and samples		// Parse perf events and samples
std::unique_ptr<PerfReaderBase> Reader =		std::unique_ptr<PerfReaderBase> Reader =
PerfReaderBase::create(Binary.get(), PerfTraceFilenames);		PerfReaderBase::create(Binary.get(), PerfTraceFilenames);
Reader->parsePerfTraces(PerfTraceFilenames);		Reader->parsePerfTraces(PerfTraceFilenames);

		wenleiUnsubmitted Not Done Reply Inline Actions Can we revert this change too and move `generateRawProfile` back into `parsePerfTraces`? wenlei: Can we revert this change too and move `generateRawProfile` back into `parsePerfTraces`?
		wleiAuthorUnsubmitted Done Reply Inline Actions fixed! wlei: fixed!
if (SkipSymbolization)		if (SkipSymbolization)
return EXIT_SUCCESS;		return EXIT_SUCCESS;

std::unique_ptr<ProfileGeneratorBase> Generator =		std::unique_ptr<ProfileGeneratorBase> Generator =
ProfileGeneratorBase::create(Binary.get(), Reader->getSampleCounters(),		ProfileGeneratorBase::create(Binary.get(), Reader->getSampleCounters(),
Reader->getPerfScriptType());		Reader->profileIsCS());
Generator->generateProfile();		Generator->generateProfile();
Generator->write();		Generator->write();

return EXIT_SUCCESS;		return EXIT_SUCCESS;
}		}

This is an archive of the discontinued LLVM Phabricator instance.

[llvm-profgen] Strip context to support non-CS profile generation for hybrid sample
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 375664

llvm/test/tools/llvm-profgen/inline-cs-noprobe.test

llvm/test/tools/llvm-profgen/noinline-cs-noprobe.test

llvm/tools/llvm-profgen/PerfReader.h

llvm/tools/llvm-profgen/PerfReader.cpp

llvm/tools/llvm-profgen/ProfileGenerator.h

llvm/tools/llvm-profgen/ProfileGenerator.cpp

llvm/tools/llvm-profgen/llvm-profgen.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[llvm-profgen] Strip context to support non-CS profile generation for hybrid sample
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 375664

llvm/test/tools/llvm-profgen/inline-cs-noprobe.test

llvm/test/tools/llvm-profgen/noinline-cs-noprobe.test

llvm/tools/llvm-profgen/PerfReader.h

llvm/tools/llvm-profgen/PerfReader.cpp

llvm/tools/llvm-profgen/ProfileGenerator.h

llvm/tools/llvm-profgen/ProfileGenerator.cpp

llvm/tools/llvm-profgen/llvm-profgen.cpp

[llvm-profgen] Strip context to support non-CS profile generation for hybrid sample
ClosedPublic