X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/8d4a86635fe661717a17fe3bb7ff2cde8a784158..cb70a2fde33e9c2455ea1cfb37ee430b00058b82:/test/php/Nominatim/PhraseTest.php?ds=inline diff --git a/test/php/Nominatim/PhraseTest.php b/test/php/Nominatim/PhraseTest.php index b5e6c1bf..e4c2bbd1 100644 --- a/test/php/Nominatim/PhraseTest.php +++ b/test/php/Nominatim/PhraseTest.php @@ -2,9 +2,32 @@ namespace Nominatim; -require_once '../../lib/Phrase.php'; +require_once(CONST_LibDir.'/Phrase.php'); -class PhraseTest extends \PHPUnit_Framework_TestCase +class TokensFullSet +{ + public function containsAny($sTerm) + { + return true; + } +} + +// phpcs:ignore PSR1.Classes.ClassDeclaration.MultipleClasses +class TokensPartialSet +{ + public function __construct($aTokens) + { + $this->aTokens = array_flip($aTokens); + } + + public function containsAny($sTerm) + { + return isset($this->aTokens[$sTerm]); + } +} + +// phpcs:ignore PSR1.Classes.ClassDeclaration.MultipleClasses +class PhraseTest extends \PHPUnit\Framework\TestCase { @@ -21,17 +44,16 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testEmptyPhrase() { $oPhrase = new Phrase('', ''); + $oPhrase->computeWordSets(array(), new TokensFullSet()); - $this->assertEquals( - array(array('')), - $oPhrase->getWordSets() - ); + $this->assertNull($oPhrase->getWordSets()); } public function testSingleWordPhrase() { $oPhrase = new Phrase('a', ''); + $oPhrase->computeWordSets(array('a'), new TokensFullSet()); $this->assertEquals( '(a)', @@ -43,20 +65,23 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testMultiWordPhrase() { $oPhrase = new Phrase('a b', ''); + $oPhrase->computeWordSets(array('a', 'b'), new TokensFullSet()); $this->assertEquals( '(a b),(a|b)', $this->serializeSets($oPhrase->getWordSets()) ); $oPhrase = new Phrase('a b c', ''); + $oPhrase->computeWordSets(array('a', 'b', 'c'), new TokensFullSet()); $this->assertEquals( - '(a b c),(a|b c),(a|b|c),(a b|c)', + '(a b c),(a|b c),(a b|c),(a|b|c)', $this->serializeSets($oPhrase->getWordSets()) ); $oPhrase = new Phrase('a b c d', ''); + $oPhrase->computeWordSets(array('a', 'b', 'c', 'd'), new TokensFullSet()); $this->assertEquals( - '(a b c d),(a|b c d),(a|b|c d),(a|b|c|d),(a|b c|d),(a b|c d),(a b|c|d),(a b c|d)', + '(a b c d),(a b c|d),(a b|c d),(a|b c d),(a b|c|d),(a|b c|d),(a|b|c d),(a|b|c|d)', $this->serializeSets($oPhrase->getWordSets()) ); } @@ -65,25 +90,50 @@ class PhraseTest extends \PHPUnit_Framework_TestCase public function testInverseWordSets() { $oPhrase = new Phrase('a b c', ''); + $oPhrase->computeWordSets(array('a', 'b', 'c'), new TokensFullSet()); $oPhrase->invertWordSets(); $this->assertEquals( - '(a b c),(c|a b),(c|b|a),(b c|a)', + '(a b c),(b c|a),(c|a b),(c|b|a)', $this->serializeSets($oPhrase->getWordSets()) ); } - public function testMaxDepth() + public function testMaxWordSets() { - $oPhrase = new Phrase(join(' ', array_fill(0, 4, 'a')), ''); + $aWords = array_fill(0, 4, 'a'); + $oPhrase = new Phrase(join(' ', $aWords), ''); + $oPhrase->computeWordSets($aWords, new TokensFullSet()); $this->assertEquals(8, count($oPhrase->getWordSets())); $oPhrase->invertWordSets(); $this->assertEquals(8, count($oPhrase->getWordSets())); - $oPhrase = new Phrase(join(' ', array_fill(0, 18, 'a')), ''); - $this->assertEquals(41226, count($oPhrase->getWordSets())); + $aWords = array_fill(0, 18, 'a'); + $oPhrase = new Phrase(join(' ', $aWords), ''); + $oPhrase->computeWordSets($aWords, new TokensFullSet()); + $this->assertEquals(100, count($oPhrase->getWordSets())); $oPhrase->invertWordSets(); - $this->assertEquals(41226, count($oPhrase->getWordSets())); + $this->assertEquals(100, count($oPhrase->getWordSets())); + } + + + public function testPartialTokensShortTerm() + { + $oPhrase = new Phrase('a b c d', ''); + $oPhrase->computeWordSets(array('a', 'b', 'c', 'd'), new TokensPartialSet(array('a', 'b', 'd', 'b c', 'b c d'))); + $this->assertEquals( + '(a|b c d),(a|b c|d)', + $this->serializeSets($oPhrase->getWordSets()) + ); + } + + + public function testPartialTokensLongTerm() + { + $aWords = array_fill(0, 18, 'a'); + $oPhrase = new Phrase(join(' ', $aWords), ''); + $oPhrase->computeWordSets($aWords, new TokensPartialSet(array('a', 'a a a a a'))); + $this->assertEquals(80, count($oPhrase->getWordSets())); } }