Diff 113361

cfe/trunk/include/clang/Analysis/CloneDetection.h

Show First 20 Lines • Show All 246 Lines • ▼ Show 20 Lines	public:
/// \param Compare The comparison function that all clones are supposed to		/// \param Compare The comparison function that all clones are supposed to
/// pass. Should return true if and only if two clones belong		/// pass. Should return true if and only if two clones belong
/// to the same CloneGroup.		/// to the same CloneGroup.
static void splitCloneGroups(		static void splitCloneGroups(
std::vector<CloneDetector::CloneGroup> &CloneGroups,		std::vector<CloneDetector::CloneGroup> &CloneGroups,
std::function<bool(const StmtSequence &, const StmtSequence &)> Compare);		std::function<bool(const StmtSequence &, const StmtSequence &)> Compare);
};		};

/// Searches all children of the given clones for type II clones (i.e. they are		/// This constraint moves clones into clone groups of type II via hashing.
/// identical in every aspect beside the used variable names).		///
class RecursiveCloneTypeIIConstraint {		/// Clones with different hash values are moved into separate clone groups.
		/// Collisions are possible, and this constraint does nothing to address
/// Generates and saves a hash code for the given Stmt.		/// them. Add the slower RecursiveCloneTypeIIVerifyConstraint later in the
/// \param S The given Stmt.		/// constraint chain, not necessarily immediately, to eliminate hash collisions
/// \param D The Decl containing S.		/// through a more detailed analysis.
/// \param StmtsByHash Output parameter that will contain the hash codes for		class RecursiveCloneTypeIIHashConstraint {
/// each StmtSequence in the given Stmt.		public:
/// \return The hash code of the given Stmt.		void constrain(std::vector<CloneDetector::CloneGroup> &Sequences);
///		};
/// If the given Stmt is a CompoundStmt, this method will also generate
/// hashes for all possible StmtSequences in the children of this Stmt.
size_t saveHash(const Stmt S, const Decl D,
std::vector<std::pair<size_t, StmtSequence>> &StmtsByHash);

		/// This constraint moves clones into clone groups of type II by comparing them.
		///
		/// Clones that aren't type II clones are moved into separate clone groups.
		/// In contrast to the RecursiveCloneTypeIIHashConstraint, all clones in a clone
		/// group are guaranteed to be type II clones of each other, but it is too
		/// slow to efficiently handle large amounts of clones.
		class RecursiveCloneTypeIIVerifyConstraint {
public:		public:
void constrain(std::vector<CloneDetector::CloneGroup> &Sequences);		void constrain(std::vector<CloneDetector::CloneGroup> &Sequences);
};		};

/// Ensures that every clone has at least the given complexity.		/// Ensures that every clone has at least the given complexity.
///		///
/// Complexity is here defined as the total amount of children of a statement.		/// Complexity is here defined as the total amount of children of a statement.
/// This constraint assumes the first statement in the group is representative		/// This constraint assumes the first statement in the group is representative
▲ Show 20 Lines • Show All 160 Lines • Show Last 20 Lines

cfe/trunk/lib/Analysis/CloneDetection.cpp

Show First 20 Lines • Show All 232 Lines • ▼ Show 20 Lines	static size_t createHash(llvm::MD5 &Hash) {
// Copy as much as possible of the generated hash code to the Stmt's hash		// Copy as much as possible of the generated hash code to the Stmt's hash
// code.		// code.
std::memcpy(&HashCode, &HashResult,		std::memcpy(&HashCode, &HashResult,
std::min(sizeof(HashCode), sizeof(HashResult)));		std::min(sizeof(HashCode), sizeof(HashResult)));

return HashCode;		return HashCode;
}		}

size_t RecursiveCloneTypeIIConstraint::saveHash(		/// Generates and saves a hash code for the given Stmt.
const Stmt S, const Decl D,		/// \param S The given Stmt.
		/// \param D The Decl containing S.
		/// \param StmtsByHash Output parameter that will contain the hash codes for
		/// each StmtSequence in the given Stmt.
		/// \return The hash code of the given Stmt.
		///
		/// If the given Stmt is a CompoundStmt, this method will also generate
		/// hashes for all possible StmtSequences in the children of this Stmt.
		static size_t
		saveHash(const Stmt S, const Decl D,
std::vector<std::pair<size_t, StmtSequence>> &StmtsByHash) {		std::vector<std::pair<size_t, StmtSequence>> &StmtsByHash) {
llvm::MD5 Hash;		llvm::MD5 Hash;
ASTContext &Context = D->getASTContext();		ASTContext &Context = D->getASTContext();

CloneTypeIIStmtDataCollector<llvm::MD5>(S, Context, Hash);		CloneTypeIIStmtDataCollector<llvm::MD5>(S, Context, Hash);

auto CS = dyn_cast<CompoundStmt>(S);		auto CS = dyn_cast<CompoundStmt>(S);
SmallVector<size_t, 8> ChildHashes;		SmallVector<size_t, 8> ChildHashes;

▲ Show 20 Lines • Show All 83 Lines • ▼ Show 20 Lines	static bool areSequencesClones(const StmtSequence &LHS,
FoldingSetNodeIDWrapper RHSWrapper(DataRHS);		FoldingSetNodeIDWrapper RHSWrapper(DataRHS);

CollectStmtSequenceData(LHS, LHSWrapper);		CollectStmtSequenceData(LHS, LHSWrapper);
CollectStmtSequenceData(RHS, RHSWrapper);		CollectStmtSequenceData(RHS, RHSWrapper);

return DataLHS == DataRHS;		return DataLHS == DataRHS;
}		}

void RecursiveCloneTypeIIConstraint::constrain(		void RecursiveCloneTypeIIHashConstraint::constrain(
std::vector<CloneDetector::CloneGroup> &Sequences) {		std::vector<CloneDetector::CloneGroup> &Sequences) {
// FIXME: Maybe we can do this in-place and don't need this additional vector.		// FIXME: Maybe we can do this in-place and don't need this additional vector.
std::vector<CloneDetector::CloneGroup> Result;		std::vector<CloneDetector::CloneGroup> Result;

for (CloneDetector::CloneGroup &Group : Sequences) {		for (CloneDetector::CloneGroup &Group : Sequences) {
// We assume in the following code that the Group is non-empty, so we		// We assume in the following code that the Group is non-empty, so we
// skip all empty groups.		// skip all empty groups.
if (Group.empty())		if (Group.empty())
Show All 24 Lines	for (unsigned i = 0; i < StmtsByHash.size() - 1; ++i) {
// represent a CloneGroup, so we create a new group and start checking and		// represent a CloneGroup, so we create a new group and start checking and
// adding the StmtSequences in this sequence.		// adding the StmtSequences in this sequence.
CloneDetector::CloneGroup NewGroup;		CloneDetector::CloneGroup NewGroup;

size_t PrototypeHash = Current.first;		size_t PrototypeHash = Current.first;

for (; i < StmtsByHash.size(); ++i) {		for (; i < StmtsByHash.size(); ++i) {
// A different hash value means we have reached the end of the sequence.		// A different hash value means we have reached the end of the sequence.
if (PrototypeHash != StmtsByHash[i].first \|\|		if (PrototypeHash != StmtsByHash[i].first) {
!areSequencesClones(StmtsByHash[i].second, Current.second)) {
// The current sequence could be the start of a new CloneGroup. So we		// The current sequence could be the start of a new CloneGroup. So we
// decrement i so that we visit it again in the outer loop.		// decrement i so that we visit it again in the outer loop.
// Note: i can never be 0 at this point because we are just comparing		// Note: i can never be 0 at this point because we are just comparing
// the hash of the Current StmtSequence with itself in the 'if' above.		// the hash of the Current StmtSequence with itself in the 'if' above.
assert(i != 0);		assert(i != 0);
--i;		--i;
break;		break;
}		}
// Same hash value means we should add the StmtSequence to the current		// Same hash value means we should add the StmtSequence to the current
// group.		// group.
NewGroup.push_back(StmtsByHash[i].second);		NewGroup.push_back(StmtsByHash[i].second);
}		}

// We created a new clone group with matching hash codes and move it to		// We created a new clone group with matching hash codes and move it to
// the result vector.		// the result vector.
Result.push_back(NewGroup);		Result.push_back(NewGroup);
}		}
}		}
// Sequences is the output parameter, so we copy our result into it.		// Sequences is the output parameter, so we copy our result into it.
Sequences = Result;		Sequences = Result;
}		}

		/// Splits the given clone groups using the detailed pairwise comparison.
		///
		/// Every group in \p Sequences is handed to CloneConstraint::splitCloneGroups
		/// with areSequencesClones() as the comparison function, i.e. the predicate
		/// that decides whether two sequences belong to the same CloneGroup.
		/// \param Sequences The clone groups to split; modified in place by
		///                  splitCloneGroups.
		void RecursiveCloneTypeIIVerifyConstraint::constrain(
		    std::vector<CloneDetector::CloneGroup> &Sequences) {
		  // Stateless predicate: two sequences stay in the same group only when
		  // the full data comparison says they are clones of each other.
		  auto BelongTogether = [](const StmtSequence &LHS,
		                           const StmtSequence &RHS) {
		    return areSequencesClones(LHS, RHS);
		  };

		  CloneConstraint::splitCloneGroups(Sequences, BelongTogether);
		}

size_t MinComplexityConstraint::calculateStmtComplexity(		size_t MinComplexityConstraint::calculateStmtComplexity(
const StmtSequence &Seq, const std::string &ParentMacroStack) {		const StmtSequence &Seq, const std::string &ParentMacroStack) {
if (Seq.empty())		if (Seq.empty())
return 0;		return 0;

size_t Complexity = 1;		size_t Complexity = 1;

ASTContext &Context = Seq.getASTContext();		ASTContext &Context = Seq.getASTContext();
▲ Show 20 Lines • Show All 197 Lines • Show Last 20 Lines

cfe/trunk/lib/StaticAnalyzer/Checkers/CloneChecker.cpp

Show First 20 Lines • Show All 75 Lines • ▼ Show 20 Lines	void CloneChecker::checkEndOfTranslationUnit(const TranslationUnitDecl *TU,
StringRef IgnoredFilesPattern = Mgr.getAnalyzerOptions().getOptionAsString(		StringRef IgnoredFilesPattern = Mgr.getAnalyzerOptions().getOptionAsString(
"IgnoredFilesPattern", "", this);		"IgnoredFilesPattern", "", this);

// Let the CloneDetector create a list of clones from all the analyzed		// Let the CloneDetector create a list of clones from all the analyzed
// statements. We don't filter for matching variable patterns at this point		// statements. We don't filter for matching variable patterns at this point
// because reportSuspiciousClones() wants to search them for errors.		// because reportSuspiciousClones() wants to search them for errors.
std::vector<CloneDetector::CloneGroup> AllCloneGroups;		std::vector<CloneDetector::CloneGroup> AllCloneGroups;

Detector.findClones(AllCloneGroups,		Detector.findClones(
FilenamePatternConstraint(IgnoredFilesPattern),		AllCloneGroups, FilenamePatternConstraint(IgnoredFilesPattern),
RecursiveCloneTypeIIConstraint(),		RecursiveCloneTypeIIHashConstraint(), MinGroupSizeConstraint(2),
MinComplexityConstraint(MinComplexity),		MinComplexityConstraint(MinComplexity),
MinGroupSizeConstraint(2), OnlyLargestCloneConstraint());		RecursiveCloneTypeIIVerifyConstraint(), OnlyLargestCloneConstraint());

if (ReportSuspiciousClones)		if (ReportSuspiciousClones)
reportSuspiciousClones(BR, Mgr, AllCloneGroups);		reportSuspiciousClones(BR, Mgr, AllCloneGroups);

// We are done for this translation unit unless we also need to report normal		// We are done for this translation unit unless we also need to report normal
// clones.		// clones.
if (!ReportNormalClones)		if (!ReportNormalClones)
return;		return;
▲ Show 20 Lines • Show All 108 Lines • Show Last 20 Lines

cfe/trunk/unittests/Analysis/CloneDetectionTest.cpp

Show First 20 Lines • Show All 63 Lines • ▼ Show 20 Lines	TEST(CloneDetector, FilterFunctionsByName) {
// Push all the function bodies into the detector.		// Push all the function bodies into the detector.
CloneDetectionVisitor Visitor(Detector);		CloneDetectionVisitor Visitor(Detector);
Visitor.TraverseTranslationUnitDecl(TU);		Visitor.TraverseTranslationUnitDecl(TU);

// Find clones with the usual settings, but we want to filter out		// Find clones with the usual settings, but we want to filter out
// all statements from functions whose names start with "bar".		// all statements from functions whose names start with "bar".
std::vector<CloneDetector::CloneGroup> CloneGroups;		std::vector<CloneDetector::CloneGroup> CloneGroups;
Detector.findClones(CloneGroups, NoBarFunctionConstraint(),		Detector.findClones(CloneGroups, NoBarFunctionConstraint(),
RecursiveCloneTypeIIConstraint(),		RecursiveCloneTypeIIHashConstraint(),
MinComplexityConstraint(2), MinGroupSizeConstraint(2),		MinComplexityConstraint(2), MinGroupSizeConstraint(2),
		RecursiveCloneTypeIIVerifyConstraint(),
OnlyLargestCloneConstraint());		OnlyLargestCloneConstraint());

ASSERT_EQ(CloneGroups.size(), 1u);		ASSERT_EQ(CloneGroups.size(), 1u);
ASSERT_EQ(CloneGroups.front().size(), 2u);		ASSERT_EQ(CloneGroups.front().size(), 2u);

for (auto &Clone : CloneGroups.front()) {		for (auto &Clone : CloneGroups.front()) {
const auto ND = dyn_cast<const FunctionDecl>(Clone.getContainingDecl());		const auto ND = dyn_cast<const FunctionDecl>(Clone.getContainingDecl());
ASSERT_TRUE(ND != nullptr);		ASSERT_TRUE(ND != nullptr);
// Check that no function name starting with "bar" is in the results...		// Check that no function name starting with "bar" is in the results...
ASSERT_TRUE(ND->getNameAsString().find("bar") != 0);		ASSERT_TRUE(ND->getNameAsString().find("bar") != 0);
}		}

// Retry above's example without the filter...		// Retry above's example without the filter...
CloneGroups.clear();		CloneGroups.clear();

Detector.findClones(CloneGroups, RecursiveCloneTypeIIConstraint(),		Detector.findClones(CloneGroups, RecursiveCloneTypeIIHashConstraint(),
MinComplexityConstraint(2), MinGroupSizeConstraint(2),		MinComplexityConstraint(2), MinGroupSizeConstraint(2),
		RecursiveCloneTypeIIVerifyConstraint(),
OnlyLargestCloneConstraint());		OnlyLargestCloneConstraint());
ASSERT_EQ(CloneGroups.size(), 1u);		ASSERT_EQ(CloneGroups.size(), 1u);
ASSERT_EQ(CloneGroups.front().size(), 4u);		ASSERT_EQ(CloneGroups.front().size(), 4u);

// Count how many functions with the bar prefix we have in the results.		// Count how many functions with the bar prefix we have in the results.
int FoundFunctionsWithBarPrefix = 0;		int FoundFunctionsWithBarPrefix = 0;
for (auto &Clone : CloneGroups.front()) {		for (auto &Clone : CloneGroups.front()) {
const auto ND = dyn_cast<const FunctionDecl>(Clone.getContainingDecl());		const auto ND = dyn_cast<const FunctionDecl>(Clone.getContainingDecl());
Show All 12 Lines

This is an archive of the discontinued LLVM Phabricator instance.

[analyzer] Performance optimizations for the CloneChecker
ClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 113361

cfe/trunk/include/clang/Analysis/CloneDetection.h

cfe/trunk/lib/Analysis/CloneDetection.cpp

cfe/trunk/lib/StaticAnalyzer/Checkers/CloneChecker.cpp

cfe/trunk/unittests/Analysis/CloneDetectionTest.cpp

This is an archive of the discontinued LLVM Phabricator instance.

[analyzer] Performance optimizations for the CloneCheckerClosedPublic

Details

Diff Detail

Event Timeline

Revision Contents

Diff 113361

cfe/trunk/include/clang/Analysis/CloneDetection.h

cfe/trunk/lib/Analysis/CloneDetection.cpp

cfe/trunk/lib/StaticAnalyzer/Checkers/CloneChecker.cpp

cfe/trunk/unittests/Analysis/CloneDetectionTest.cpp

[analyzer] Performance optimizations for the CloneChecker
ClosedPublic