2020-10-29 00:11:21 -03:00
|
|
|
<?php
|
2023-10-04 21:36:11 +03:30
|
|
|
|
2020-10-29 00:11:21 -03:00
|
|
|
/**
 * Find distance (Levenshtein distance)
 *
 * Computes the edit distance between two strings: the minimum number of
 * single-character insertions, deletions and substitutions required to turn
 * $str1 into $str2.
 *
 * Valid UTF-8 input is compared character by character, so a multibyte
 * character counts as a single edit. If either string is not valid UTF-8,
 * both strings are compared byte by byte instead.
 *
 * Only two rows of the dynamic-programming table are held in memory at once.
 *
 * @param string $str1 the source string
 * @param string $str2 the target string
 * @return int the minimum number of changes to transform one string into another
 */
function findDistance($str1, $str2)
{
    // Split into UTF-8 characters; preg_split() returns false on malformed UTF-8.
    $source = preg_split('//u', $str1, -1, PREG_SPLIT_NO_EMPTY);
    $target = preg_split('//u', $str2, -1, PREG_SPLIT_NO_EMPTY);

    if ($source === false || $target === false) {
        // Fall back to bytes for BOTH inputs so they are measured in the same unit.
        // The explicit empty check is needed because str_split('') yields ['']
        // on PHP versions before 8.2.
        $source = strlen($str1) === 0 ? [] : str_split($str1);
        $target = strlen($str2) === 0 ? [] : str_split($str2);
    }

    $sourceLength = count($source);
    $targetLength = count($target);

    // Transforming to or from an empty string costs one edit per character.
    if ($sourceLength === 0) {
        return $targetLength;
    }

    if ($targetLength === 0) {
        return $sourceLength;
    }

    // Row 0 of the table: distance from each prefix of $str1 to the empty string.
    $previousRow = range(0, $sourceLength);

    foreach ($target as $rowIndex => $targetChar) {
        // Column 0: distance from the empty prefix of $str1 to this prefix of $str2.
        $currentRow = [$rowIndex + 1];

        // use formula to fill in the rest of the row
        foreach ($source as $columnIndex => $sourceChar) {
            $substitutionCost = $previousRow[$columnIndex] + ($sourceChar === $targetChar ? 0 : 1);

            $currentRow[] = min(
                $previousRow[$columnIndex + 1] + 1, // cell above + 1
                $currentRow[$columnIndex] + 1,      // cell to the left + 1
                $substitutionCost                   // diagonal cell, + 1 unless the characters match
            );
        }

        $previousRow = $currentRow;
    }

    return $previousRow[$sourceLength];
}
|