// In verbose mode, emit a line break before the next batch of output.
if ($bVerbose) {
echo "\n";
}
+
// The word list is obtained through the tokenizer object created here.
+ $oTokenizer = new \Nominatim\Tokenizer($oDB);
+
// Request 1000 words via mostFrequentWords(); the loop below iterates over them.
+ $aWords = $oTokenizer->mostFrequentWords(1000);
+
// NOTE(review): the loop below now iterates $aWords, so in the visible code
// $sSQL is no longer read - it looks like a leftover. Confirm there is no
// later use before removing it.
$sSQL = 'SELECT word FROM word WHERE word is not null ORDER BY search_name_count DESC LIMIT 1000';
- foreach ($oDB->getCol($sSQL) as $sWord) {
+ foreach ($aWords as $sWord) {
if ($bVerbose) {
echo "$sWord = ";
}
return $this->oNormalizer->transliterate($sTerm);
}
+
+ /**
+  * Fetch words from the word table, most frequent first.
+  *
+  * Selects rows whose type is 'W' and orders them by the 'count' entry
+  * of the info column in descending order.
+  *
+  * @param int $iNum Maximum number of words to return.
+  *
+  * @return mixed Whatever $this->oDB->getCol() returns for the query
+  *               (presumably a list of word strings - verify against DB class).
+  */
+ public function mostFrequentWords($iNum)
+ {
+     // The trailing space keeps the string literal and the ORDER BY keyword
+     // apart once the two fragments are joined.
+     $sSQL = "SELECT word FROM word WHERE type = 'W' ";
+     // Force the limit to an integer so that nothing but a number can end
+     // up in the SQL text.
+     $sSQL .= "ORDER BY info->'count' DESC LIMIT ".(int) $iNum;
+     return $this->oDB->getCol($sSQL);
+ }
+
+
/**
 * Transliterate a term after wrapping it in single spaces.
 *
 * The term is padded with one space on each side, passed through
 * $this->oTransliterator and the result is trimmed again.
 *
 * @param string $sTerm Term to convert.
 *
 * @return string Trimmed transliteration result.
 */
private function makeStandardWord($sTerm)
{
    $sPadded = ' '.$sTerm.' ';
    $sTransliterated = $this->oTransliterator->transliterate($sPadded);

    return trim($sTransliterated);
}
+ /**
+  * Fetch words from the word table, most frequent first.
+  *
+  * Selects rows with a non-null word and orders them by
+  * search_name_count in descending order.
+  *
+  * @param int $iNum Maximum number of words to return.
+  *
+  * @return mixed Whatever $this->oDB->getCol() returns for the query
+  *               (presumably a list of word strings - verify against DB class).
+  */
+ public function mostFrequentWords($iNum)
+ {
+     $sSQL = 'SELECT word FROM word WHERE word is not null ';
+     // Force the limit to an integer so that nothing but a number can end
+     // up in the SQL text.
+     $sSQL .= 'ORDER BY search_name_count DESC LIMIT '.(int) $iNum;
+     return $this->oDB->getCol($sSQL);
+ }
+
+
public function tokensForSpecialTerm($sTerm)
{
$aResults = array();