diff --git a/llvm/include/llvm/ADT/StringRef.h b/llvm/include/llvm/ADT/StringRef.h --- a/llvm/include/llvm/ADT/StringRef.h +++ b/llvm/include/llvm/ADT/StringRef.h @@ -240,6 +240,10 @@ unsigned edit_distance(StringRef Other, bool AllowReplacements = true, unsigned MaxEditDistance = 0) const; + LLVM_NODISCARD unsigned + edit_distance_insensitive(StringRef Other, bool AllowReplacements = true, + unsigned MaxEditDistance = 0) const; + /// str - Get the contents as an std::string. LLVM_NODISCARD std::string str() const { diff --git a/llvm/include/llvm/ADT/edit_distance.h b/llvm/include/llvm/ADT/edit_distance.h --- a/llvm/include/llvm/ADT/edit_distance.h +++ b/llvm/include/llvm/ADT/edit_distance.h @@ -36,13 +36,17 @@ /// routine is allowed to compute. If the edit distance will exceed that /// maximum, returns \c MaxEditDistance+1. /// +/// \param Map A Functor to apply to each item of the sequences before +/// comparison. If unspecified, this maps to itself. +/// /// \returns the minimum number of element insertions, removals, or (if /// \p AllowReplacements is \c true) replacements needed to transform one of /// the given sequences into the other. If zero, the sequences are identical. -template -unsigned ComputeEditDistance(ArrayRef FromArray, ArrayRef ToArray, - bool AllowReplacements = true, - unsigned MaxEditDistance = 0) { +template +unsigned ComputeEditDistance( + ArrayRef FromArray, ArrayRef ToArray, bool AllowReplacements = true, + unsigned MaxEditDistance = 0, + Functor Map = [](const T &X) -> const T & { return X; }) { // The algorithm implemented below is the "classic" // dynamic-programming algorithm for computing the Levenshtein // distance, which is described here: @@ -79,11 +83,12 @@ int OldRow = Row[x]; if (AllowReplacements) { Row[x] = std::min( - Previous + (FromArray[y-1] == ToArray[x-1] ? 0u : 1u), - std::min(Row[x-1], Row[x])+1); + Previous + (Map(FromArray[y - 1]) == Map(ToArray[x - 1]) ? 0u : 1u), + std::min(Row[x - 1], Row[x]) + 1); } else { - if (FromArray[y-1] == ToArray[x-1]) Row[x] = Previous; + if (Map(FromArray[y - 1]) == Map(ToArray[x - 1])) + Row[x] = Previous; else Row[x] = std::min(Row[x-1], Row[x]) + 1; } Previous = OldRow; diff --git a/llvm/lib/Support/StringRef.cpp b/llvm/lib/Support/StringRef.cpp --- a/llvm/lib/Support/StringRef.cpp +++ b/llvm/lib/Support/StringRef.cpp @@ -98,6 +98,13 @@ AllowReplacements, MaxEditDistance); } +unsigned llvm::StringRef::edit_distance_insensitive( + StringRef Other, bool AllowReplacements, unsigned MaxEditDistance) const { + return llvm::ComputeEditDistance( + makeArrayRef(data(), size()), makeArrayRef(Other.data(), Other.size()), + AllowReplacements, MaxEditDistance, llvm::toLower); +} + //===----------------------------------------------------------------------===// // String Operations //===----------------------------------------------------------------------===// diff --git a/llvm/unittests/ADT/StringRefTest.cpp b/llvm/unittests/ADT/StringRefTest.cpp --- a/llvm/unittests/ADT/StringRefTest.cpp +++ b/llvm/unittests/ADT/StringRefTest.cpp @@ -584,6 +584,15 @@ "people soiled our green ")); } +TEST(StringRefTest, EditDistanceInsensitive) { + StringRef Hello("HELLO"); + EXPECT_EQ(2U, Hello.edit_distance_insensitive("hill")); + EXPECT_EQ(0U, Hello.edit_distance_insensitive("hello")); + + StringRef Industry("InDuStRy"); + EXPECT_EQ(6U, Industry.edit_distance_insensitive("iNtErEsT")); +} + TEST(StringRefTest, Misc) { std::string Storage; raw_string_ostream OS(Storage);