Skip to content
This repository has been archived by the owner on Feb 5, 2019. It is now read-only.

Commit

Permalink
Extend StringRef's edit-distance algorithm to permit an upper bound on the allowed edit distance
Browse files Browse the repository at this point in the history

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@116867 91177308-0d34-0410-b5e6-96231b3b80d8
  • Loading branch information
DougGregor committed Oct 19, 2010
1 parent 8155ea4 commit 5ee568a
Show file tree
Hide file tree
Showing 2 changed files with 14 additions and 2 deletions.
7 changes: 6 additions & 1 deletion include/llvm/ADT/StringRef.h
Original file line number Diff line number Diff line change
Expand Up @@ -142,11 +142,16 @@ namespace llvm {
/// operation, rather than as two operations (an insertion and a
/// removal).
///
/// \param MaxEditDistance If non-zero, the maximum edit distance that
/// this routine is allowed to compute. If the edit distance will exceed
/// that maximum, returns \c MaxEditDistance+1. If zero, no upper bound
/// is applied.
///
/// \returns the minimum number of character insertions, removals,
/// or (if \p AllowReplacements is \c true) replacements needed to
/// transform one of the given strings into the other. If zero,
/// the strings are identical.
unsigned edit_distance(StringRef Other, bool AllowReplacements = true);
unsigned edit_distance(StringRef Other, bool AllowReplacements = true,
unsigned MaxEditDistance = 0);

/// str - Get the contents as an std::string.
std::string str() const {
Expand Down
9 changes: 8 additions & 1 deletion lib/Support/StringRef.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -68,7 +68,8 @@ int StringRef::compare_numeric(StringRef RHS) const {

// Compute the edit distance between the two given strings.
unsigned StringRef::edit_distance(llvm::StringRef Other,
bool AllowReplacements) {
bool AllowReplacements,
unsigned MaxEditDistance) {
// The algorithm implemented below is the "classic"
// dynamic-programming algorithm for computing the Levenshtein
// distance, which is described here:
Expand All @@ -94,6 +95,8 @@ unsigned StringRef::edit_distance(llvm::StringRef Other,

for (size_type y = 1; y <= m; ++y) {
current[0] = y;
unsigned BestThisRow = current[0];

for (size_type x = 1; x <= n; ++x) {
if (AllowReplacements) {
current[x] = min(previous[x-1] + ((*this)[y-1] == Other[x-1]? 0u:1u),
Expand All @@ -103,8 +106,12 @@ unsigned StringRef::edit_distance(llvm::StringRef Other,
if ((*this)[y-1] == Other[x-1]) current[x] = previous[x-1];
else current[x] = min(current[x-1], previous[x]) + 1;
}
BestThisRow = min(BestThisRow, current[x]);
}

if (MaxEditDistance && BestThisRow > MaxEditDistance)
return MaxEditDistance + 1;

unsigned *tmp = current;
current = previous;
previous = tmp;
Expand Down

0 comments on commit 5ee568a

Please sign in to comment.