Files
pytorch/torch/csrc/jit/frontend/edit_distance.cpp
cyy 70d7638b0d Fix clang-tidy suppression in torch/csrc/jit (#152271)
Remove some clang-tidy suppression in torch/csrc/jit by applying fixes or refactoring.

Pull Request resolved: https://github.com/pytorch/pytorch/pull/152271
Approved by: https://github.com/Skylion007, https://github.com/malfet

Co-authored-by: Aaron Gokaslan <aaronGokaslan@gmail.com>
2025-04-27 21:18:39 +00:00

56 lines
1.6 KiB
C++

#include <torch/csrc/jit/frontend/edit_distance.h>
#include <algorithm>
#include <cstring>
#include <memory>
namespace torch::jit {
// Computes the Levenshtein edit distance between two NUL-terminated words
// using a single-row dynamic-programming table.
//
// word1, word2: the strings to compare; their lengths are taken with
//   std::strlen.
// maxEditDistance: if non-zero, the computation stops early and returns
//   maxEditDistance + 1 as soon as every entry of the current row exceeds
//   maxEditDistance. If zero, no early exit is performed.
//
// Returns the edit distance, or maxEditDistance + 1 on early exit. The early
// exit only inspects the row minimum, so a computation that runs to
// completion can still return a value greater than maxEditDistance; callers
// should compare the result against their own limit.
//
// reference: http://llvm.org/doxygen/edit__distance_8h_source.html
size_t ComputeEditDistance(
    const char* word1,
    const char* word2,
    size_t maxEditDistance) {
  const size_t m = std::strlen(word1);
  const size_t n = std::strlen(word2);

  // Short words use the stack buffer; longer ones fall back to the heap.
  constexpr size_t small_buffer_size = 64;
  // NOLINTNEXTLINE(cppcoreguidelines-avoid-c-arrays,modernize-avoid-c-arrays)
  unsigned small_buffer[small_buffer_size];
  // NOLINTNEXTLINE(cppcoreguidelines-avoid-c-arrays,modernize-avoid-c-arrays)
  std::unique_ptr<unsigned[]> allocated;
  unsigned* row = small_buffer;
  if (n + 1 > small_buffer_size) {
    allocated = std::make_unique<unsigned[]>(n + 1);
    row = allocated.get();
  }

  // Row for the empty prefix of word1: turning "" into word2[0..i) costs i
  // insertions. Index 0 must be initialised as well, otherwise row[n] is read
  // uninitialised when both words are empty.
  for (size_t i = 0; i <= n; ++i) {
    row[i] = static_cast<unsigned>(i);
  }

  for (size_t y = 1; y <= m; ++y) {
    row[0] = static_cast<unsigned>(y);
    unsigned best_this_row = row[0];
    // `previous` holds the diagonal (previous row, column x - 1) entry.
    unsigned previous = static_cast<unsigned>(y - 1);
    for (size_t x = 1; x <= n; ++x) {
      const unsigned old_row = row[x];
      const unsigned substitution =
          previous + (word1[y - 1] == word2[x - 1] ? 0u : 1u);
      const unsigned insert_or_delete = std::min(row[x - 1], row[x]) + 1;
      row[x] = std::min(substitution, insert_or_delete);
      previous = old_row;
      best_this_row = std::min(best_this_row, row[x]);
    }
    if (maxEditDistance && best_this_row > maxEditDistance) {
      return maxEditDistance + 1;
    }
  }

  return row[n];
}
} // namespace torch::jit