Update fuzz.php

Set the strings in lower case to avoid missing results because of the case.
This commit is contained in:
znvcx 2022-11-23 20:19:36 +00:00 committed by GitHub
parent 55d3b162bf
commit 64612b85f9
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@ -34,6 +34,7 @@ class Fuzz
*/
public function __construct($source, $maxResults, $searchMode, $useLCS)
{
$this->_source = $source;
$this->_sourceLen = count($source);
$this->_maxResults = max($maxResults, 1);
@ -61,6 +62,9 @@ class Fuzz
$results = [];
$scores = [];
// put the text in lower case to avoid missing a result because of the case
$search = strtolower($search);
// Nullify these parameters if they are irrelevant to searchMode
if (!$this->_useLCS) $minLCS = null;
if ($this->_searchMode != 0) $maxDistance = null;
@ -125,6 +129,11 @@ class Fuzz
{
$suffix = [];
$result = 0;
// put the text in lower case to avoid missing a result because of the case
$source = strtolower($source);
$target = strtolower($target);
$n = mb_strlen($source, CHARSET);
$m = mb_strlen($target, CHARSET);
@ -158,6 +167,10 @@ class Fuzz
$n = mb_strlen($source, CHARSET);
$m = mb_strlen($target, CHARSET);
// put the text in lower case to avoid missing a result because of the case
$source = strtolower($source);
$target = strtolower($target);
if ($n === 0) {
return $m;
} elseif ($m === 0) {
@ -205,8 +218,12 @@ class Fuzz
*/
public function getJaroWinkler($first, $second)
{
$shorter = '';
$longer = '';
$shorter;
$longer;
// put the text in lower case to avoid missing a result because of the case
$first = strtolower($first);
$second = strtolower($second);
if (mb_strlen($first, CHARSET) > mb_strlen($second, CHARSET)) {
$longer = mb_strtolower($first, CHARSET);
@ -255,6 +272,11 @@ class Fuzz
{
$common = '';
$copy = $second;
// put the text in lower case to avoid missing a result because of the case
$first = strtolower($first);
$second = strtolower($second);
$firstLen = mb_strlen($first, CHARSET);
$secondLen = mb_strlen($second, CHARSET);
@ -285,6 +307,11 @@ class Fuzz
private function _getTranspositions($first, $second)
{
$trans = 0;
// put the text in lower case to avoid missing a result because of the case
$first = strtolower($first);
$second = strtolower($second);
$firstLen = mb_strlen($first, CHARSET);
for ($i = 0; $i < $firstLen; $i++) {
@ -307,6 +334,10 @@ class Fuzz
*/
private function _getPrefix($first, $second)
{
// put the text in lower case to avoid missing a result because of the case
$first = strtolower($first);
$second = strtolower($second);
if (mb_strlen($first, CHARSET) == 0 || mb_strlen($second, CHARSET) == 0) {
return '';
}
@ -331,6 +362,10 @@ class Fuzz
*/
private function _getDiffIndex($first, $second)
{
// put the text in lower case to avoid missing a result because of the case
$first = strtolower($first);
$second = strtolower($second);
if ($first == $second) {
return -1;
}