1
0
mirror of https://github.com/robonen/tools.git synced 2026-03-20 10:54:44 +00:00

feat(packages/stdlib): levenshtein distance util

This commit is contained in:
2024-04-11 00:11:29 +07:00
parent 65ba312f4c
commit 002215303a
3 changed files with 77 additions and 0 deletions

View File

@@ -0,0 +1 @@
// `export *` forwards only named exports, never `default`. The implementation
// module exposes the function as its default export, so it is additionally
// re-exported here under an explicit name to make it reachable via this barrel.
export * from './levenshtein-distance';
export { default as levenshteinDistance } from './levenshtein-distance';

View File

@@ -0,0 +1,32 @@
import { describe, expect, it } from 'vitest';
import levenshteinDistance from '.';
describe('levenshteinDistance', () => {
  it('should calculate edit distance between two strings', () => {
    // Each entry is [source, target, expected distance].
    const samples: Array<[string, string, number]> = [
      // delete the leading I
      ['islander', 'slander', 1],
      // substitute M->K and T->M, then append an A
      ['mart', 'karma', 3],
      // substitute K->S and E->I, then append a G
      ['kitten', 'sitting', 3],
      // prepend the 4 letters FOOT
      ['ball', 'football', 4],
      // drop the 4 trailing letters BALL
      ['football', 'foot', 4],
      // substitute the first 5 characters INTEN->EXECU
      ['intention', 'execution', 5],
    ];

    for (const [source, target, distance] of samples)
      expect(levenshteinDistance(source, target)).toBe(distance);
  });

  it('should handle edge cases', () => {
    // When one side is empty the distance is the length of the other side.
    const samples: Array<[string, string, number]> = [
      ['', '', 0],
      ['a', '', 1],
      ['', 'a', 1],
      ['abc', '', 3],
      ['', 'abc', 3],
    ];

    for (const [source, target, distance] of samples)
      expect(levenshteinDistance(source, target)).toBe(distance);
  });
});

View File

@@ -0,0 +1,44 @@
/**
 * Calculate the Levenshtein (edit) distance between two strings: the minimum
 * number of single-character insertions, deletions and substitutions needed
 * to turn `a` into `b`.
 *
 * Characters are compared as UTF-16 code units, so a character outside the
 * Basic Multilingual Plane (for example an emoji) counts as two units.
 *
 * @param a First string
 * @param b Second string
 * @returns The Levenshtein distance between the two strings
 *
 * @example
 * levenshteinDistance('kitten', 'sitting'); // 3
 */
export default function levenshteinDistance(a: string, b: string): number {
  // Identical strings need no edits
  if (a === b) return 0;

  // If either string is empty, the distance is the length of the other string
  if (a.length === 0) return b.length;
  if (b.length === 0) return a.length;

  // The distance is symmetric, so the shorter string is laid along the row:
  // only one row of the classic matrix is kept, sized to the shorter input.
  const [shorter, longer] = a.length <= b.length ? [a, b] : [b, a];
  const width = shorter.length;

  // row[i] is the distance between the first i units of `shorter` and the
  // prefix of `longer` processed so far. For the empty prefix that is i.
  const row: number[] = Array.from({ length: width + 1 }, (_, i) => i);

  // Value of the cell most recently written; after the final pass this is the
  // bottom-right cell of the matrix, i.e. the answer.
  let current = 0;

  for (let j = 1; j <= longer.length; j++) {
    // Hoisted: the unit of `longer` is the same for the whole row
    const longerUnit = longer.charCodeAt(j - 1);

    // First column: turning an empty string into j units costs j insertions
    let diagonal = j - 1; // previous row, column i - 1
    current = j; // current row, column i - 1
    row[0] = j;

    for (let i = 1; i <= width; i++) {
      // `row` has width + 1 entries and 1 <= i <= width, so this is in bounds
      const above = row[i]!; // previous row, column i
      const cost = shorter.charCodeAt(i - 1) === longerUnit ? 0 : 1;

      current = Math.min(
        current + 1, // edit against the cell to the left
        above + 1, // edit against the cell above
        diagonal + cost, // substitution (free when the units match)
      );

      diagonal = above;
      row[i] = current;
    }
  }

  return current;
}