X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/4e99f8a3408d59f5c6bf8d934fda7bb3726f2da2..4a2873617dcbaf58ff6135aa7d8dcb115c0cc5ba:/test/php/Nominatim/PhraseTest.php diff --git a/test/php/Nominatim/PhraseTest.php b/test/php/Nominatim/PhraseTest.php index db8d8b50..42166e34 100644 --- a/test/php/Nominatim/PhraseTest.php +++ b/test/php/Nominatim/PhraseTest.php @@ -2,10 +2,35 @@ namespace Nominatim; -require_once '../../lib/Phrase.php'; +require_once(CONST_LibDir.'/Phrase.php'); -class PhraseTest extends \PHPUnit_Framework_TestCase +class TokensFullSet { + public function containsAny($sTerm) + { + return true; + } +} + +// phpcs:ignore PSR1.Classes.ClassDeclaration.MultipleClasses +class TokensPartialSet +{ + public function __construct($aTokens) + { + $this->aTokens = array_flip($aTokens); + } + + public function containsAny($sTerm) + { + return isset($this->aTokens[$sTerm]); + } +} + +// phpcs:ignore PSR1.Classes.ClassDeclaration.MultipleClasses +class PhraseTest extends \PHPUnit\Framework\TestCase +{ + + private function serializeSets($aSets) { $aParts = array(); @@ -19,6 +44,7 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testEmptyPhrase() { $oPhrase = new Phrase('', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals( array(array('')), @@ -30,6 +56,7 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testSingleWordPhrase() { $oPhrase = new Phrase('a', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals( '(a)', @@ -41,20 +68,23 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testMultiWordPhrase() { $oPhrase = new Phrase('a b', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals( '(a b),(a|b)', $this->serializeSets($oPhrase->getWordSets()) ); $oPhrase = new Phrase('a b c', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals( - '(a b c),(a|b c),(a|b|c),(a b|c)', + '(a b c),(a|b c),(a b|c),(a|b|c)', $this->serializeSets($oPhrase->getWordSets()) ); $oPhrase = new Phrase('a b c d', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals( - '(a b c d),(a|b c d),(a|b|c d),(a|b|c|d),(a|b c|d),(a b|c d),(a b|c|d),(a b c|d)', + '(a b c d),(a b c|d),(a b|c d),(a|b c d),(a b|c|d),(a|b c|d),(a|b|c d),(a|b|c|d)', $this->serializeSets($oPhrase->getWordSets()) ); } @@ -63,25 +93,47 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testInverseWordSets() { $oPhrase = new Phrase('a b c', ''); + $oPhrase->computeWordSets(new TokensFullSet()); $oPhrase->invertWordSets(); $this->assertEquals( - '(a b c),(c|a b),(c|b|a),(b c|a)', + '(a b c),(b c|a),(c|a b),(c|b|a)', $this->serializeSets($oPhrase->getWordSets()) ); } - public function testMaxDepth() + public function testMaxWordSets() { $oPhrase = new Phrase(join(' ', array_fill(0, 4, 'a')), ''); + $oPhrase->computeWordSets(new TokensFullSet()); $this->assertEquals(8, count($oPhrase->getWordSets())); $oPhrase->invertWordSets(); $this->assertEquals(8, count($oPhrase->getWordSets())); $oPhrase = new Phrase(join(' ', array_fill(0, 18, 'a')), ''); - $this->assertEquals(41226, count($oPhrase->getWordSets())); + $oPhrase->computeWordSets(new TokensFullSet()); + $this->assertEquals(100, count($oPhrase->getWordSets())); $oPhrase->invertWordSets(); - $this->assertEquals(41226, count($oPhrase->getWordSets())); + $this->assertEquals(100, count($oPhrase->getWordSets())); + } + + + public function testPartialTokensShortTerm() + { + $oPhrase = new Phrase('a b c d', ''); + $oPhrase->computeWordSets(new TokensPartialSet(array('a', 'b', 'd', 'b c', 'b c d'))); + $this->assertEquals( + '(a|b c d),(a|b c|d)', + $this->serializeSets($oPhrase->getWordSets()) + ); + } + + + public function testPartialTokensLongTerm() + { + $oPhrase = new Phrase(join(' ', array_fill(0, 18, 'a')), ''); + $oPhrase->computeWordSets(new TokensPartialSet(array('a', 'a a a a a'))); + $this->assertEquals(80, count($oPhrase->getWordSets())); } }