Index: tools/llvm-exegesis/lib/Clustering.cpp =================================================================== --- tools/llvm-exegesis/lib/Clustering.cpp +++ tools/llvm-exegesis/lib/Clustering.cpp @@ -8,7 +8,6 @@ //===----------------------------------------------------------------------===// #include "Clustering.h" -#include "llvm/ADT/SetVector.h" #include "llvm/ADT/SmallVector.h" #include @@ -92,8 +91,14 @@ } void InstructionBenchmarkClustering::dbScan(const size_t MinPts) { - std::vector Neighbors; // Persistent buffer to avoid allocs. - for (size_t P = 0, NumPoints = Points_.size(); P < NumPoints; ++P) { + const size_t NumPoints = Points_.size(); + + // Persistent buffers to avoid allocs. + std::vector Neighbors; + std::vector ToProcess(NumPoints); + std::vector Added(NumPoints); + + for (size_t P = 0; P < NumPoints; ++P) { if (!ClusterIdForPoint_[P].isUndef()) continue; // Previously processed in inner loop. rangeQuery(P, Neighbors); @@ -109,32 +114,35 @@ Cluster &CurrentCluster = Clusters_.back(); ClusterIdForPoint_[P] = CurrentCluster.Id; /* Label initial point */ CurrentCluster.PointIndices.push_back(P); + Added[P] = 1; // Process P's neighbors. - llvm::SetVector> ToProcess; - ToProcess.insert(Neighbors.begin(), Neighbors.end()); - while (!ToProcess.empty()) { + size_t Tail = 0; + for (size_t Q : Neighbors) + if (!Added[Q]) { + ToProcess[Tail++] = Q; + Added[Q] = 1; + } + for (size_t Head = 0; Head < Tail; ++Head) { // Retrieve a point from the set. - const size_t Q = *ToProcess.begin(); - ToProcess.erase(ToProcess.begin()); + P = ToProcess[Head]; - if (ClusterIdForPoint_[Q].isNoise()) { - // Change noise point to border point. - ClusterIdForPoint_[Q] = CurrentCluster.Id; - CurrentCluster.PointIndices.push_back(Q); + // Add P to the current custer. + ClusterId CID = ClusterIdForPoint_[P]; + ClusterIdForPoint_[P] = CurrentCluster.Id; + CurrentCluster.PointIndices.push_back(P); + if (CID.isNoise()) continue; - } - if (!ClusterIdForPoint_[Q].isUndef()) { - continue; // Previously processed. - } - // Add Q to the current custer. - ClusterIdForPoint_[Q] = CurrentCluster.Id; - CurrentCluster.PointIndices.push_back(Q); - // And extend to the neighbors of Q if the region is dense enough. - rangeQuery(Q, Neighbors); - if (Neighbors.size() + 1 >= MinPts) { - ToProcess.insert(Neighbors.begin(), Neighbors.end()); - } + assert(CID.isUndef()); + + // And extend to the neighbors of P if the region is dense enough. + rangeQuery(P, Neighbors); + if (Neighbors.size() + 1 >= MinPts) + for (size_t Q : Neighbors) + if (!Added[Q]) { + ToProcess[Tail++] = Q; + Added[Q] = 1; + } } } // assert(Neighbors.capacity() == (Points_.size() - 1));