oDB =& $oDB;
        $this->oPlaceLookup = new PlaceLookup($this->oDB);
        $this->oTokenizer = new \Nominatim\Tokenizer($this->oDB);
    }

    /**
     * Store the language preference list used for result localisation.
     *
     * The list is handed unchanged to the place lookup in lookup(); the
     * presence of a 'name:en' key additionally enables the US state
     * abbreviation rewriting there.
     *
     * @param array $aLangPref Language preference list.
     *
     * @return void
     */
    public function setLanguagePreference($aLangPref)
    {
        $this->aLangPrefOrder = $aLangPref;
    }

    /**
     * Build the URL parameters that reproduce the current search.
     *
     * Starts from the structured query (if set) or the free-form 'q' string,
     * merges the parameters reported by the place lookup and appends the
     * exclude list, bounded flag, country codes and viewbox when present.
     *
     * @return array Map of URL parameter name to value.
     */
    public function getMoreUrlParams()
    {
        if ($this->aStructuredQuery) {
            $aParams = $this->aStructuredQuery;
        } else {
            $aParams = array('q' => $this->sQuery);
        }

        $aParams = array_merge($aParams, $this->oPlaceLookup->getMoreUrlParams());

        if ($this->aExcludePlaceIDs) {
            $aParams['exclude_place_ids'] = implode(',', $this->aExcludePlaceIDs);
        }

        if ($this->bBoundedSearch) {
            $aParams['bounded'] = '1';
        }

        if ($this->aCountryCodes) {
            $aParams['countrycodes'] = implode(',', $this->aCountryCodes);
        }

        if ($this->aViewBox) {
            $aParams['viewbox'] = join(',', $this->aViewBox);
        }

        return $aParams;
    }

    /**
     * Set the maximum number of results to return.
     *
     * The value is clamped to the range 1..50. The limit used for the
     * individual searches is padded by min(limit, 10) on top of the final
     * result limit.
     *
     * @param int $iLimit Requested number of results.
     *
     * @return void
     */
    public function setLimit($iLimit = 10)
    {
        if ($iLimit > 50) {
            $iLimit = 50;
        } elseif ($iLimit < 1) {
            $iLimit = 1;
        }

        $this->iFinalLimit = $iLimit;
        $this->iLimit = $iLimit + min($iLimit, 10);
    }

    /**
     * Restrict the address rank range according to a named feature type.
     *
     * Recognised values are 'country', 'state', 'city' and 'settlement';
     * any other value leaves the rank range untouched.
     *
     * @param string $sFeatureType Feature type name.
     *
     * @return void
     */
    public function setFeatureType($sFeatureType)
    {
        switch ($sFeatureType) {
            case 'country':
                $this->setRankRange(4, 4);
                break;
            case 'state':
                $this->setRankRange(8, 8);
                break;
            case 'city':
                $this->setRankRange(14, 16);
                break;
            case 'settlement':
                $this->setRankRange(8, 20);
                break;
        }
    }

    /**
     * Set the inclusive address rank range results have to fall into.
     *
     * NOTE(review): both values are interpolated into SQL in lookup();
     * callers are expected to pass integers only.
     *
     * @param int $iMin Minimum address rank.
     * @param int $iMax Maximum address rank.
     *
     * @return void
     */
    public function setRankRange($iMin, $iMax)
    {
        $this->iMinAddressRank = $iMin;
        $this->iMaxAddressRank = $iMax;
    }

    /**
     * Set the viewbox from four coordinates.
     *
     * The corners are normalised so that index 0/1 hold the smaller x/y and
     * index 2/3 the larger x/y, clamped to [-180, 180] and [-90, 90].
     * A box with (almost) no extent in either direction is reported through
     * userError().
     *
     * @param array $aViewbox Four coordinates in the order x1, y1, x2, y2.
     *
     * @return void
     */
    public function setViewbox($aViewbox)
    {
        $aBox = array_map('floatval', $aViewbox);

        $this->aViewBox[0] = max(-180.0, min($aBox[0], $aBox[2]));
        $this->aViewBox[1] = max(-90.0, min($aBox[1], $aBox[3]));
        $this->aViewBox[2] = min(180.0, max($aBox[0], $aBox[2]));
        $this->aViewBox[3] = min(90.0, max($aBox[1], $aBox[3]));

        if ($this->aViewBox[2] - $this->aViewBox[0] < 0.000000001
            || $this->aViewBox[3] - $this->aViewBox[1] < 0.000000001
        ) {
            userError("Bad parameter 'viewbox'. Not a box.");
        }
    }

    /**
     * Compute the importance multiplier of a point relative to the viewbox.
     *
     * @param float $fX X coordinate (longitude) of the point.
     * @param float $fY Y coordinate (latitude) of the point.
     *
     * @return int|float 1 when no viewbox is set or the point lies inside it,
     *                   0.5 when it lies within three times the half-extent
     *                   around the box centre, 0.25 otherwise.
     */
    private function viewboxImportanceFactor($fX, $fY)
    {
        if (!$this->aViewBox) {
            return 1;
        }

        // Half extents of the box and distance of the point from its centre.
        $fWidth = ($this->aViewBox[2] - $this->aViewBox[0])/2;
        $fHeight = ($this->aViewBox[3] - $this->aViewBox[1])/2;

        $fXDist = abs($fX - ($this->aViewBox[0] + $this->aViewBox[2])/2);
        $fYDist = abs($fY - ($this->aViewBox[1] + $this->aViewBox[3])/2);

        if ($fXDist <= $fWidth && $fYDist <= $fHeight) {
            return 1;
        }

        if ($fXDist <= $fWidth * 3 && $fYDist <= 3 * $fHeight) {
            return 0.5;
        }

        return 0.25;
    }

    /**
     * Set a free-form query string and discard any structured query.
     *
     * @param string $sQueryString Query to search for.
     *
     * @return void
     */
    public function setQuery($sQueryString)
    {
        $this->sQuery = $sQueryString;
        $this->aStructuredQuery = false;
    }

    /**
     * Return the current query string.
     *
     * @return string|false Query string; setStructuredQuery() resets it to
     *                      false when no structured element is given.
     */
    public function getQueryString()
    {
        return $this->sQuery;
    }

    /**
     * Configure the search from a request parameter object.
     *
     * Reads 'bounded', 'limit', 'offset', 'fallback', 'exclude_place_ids',
     * 'featureType'/'featuretype', 'countrycodes', 'viewboxlbrt', 'viewbox',
     * 'route'/'routewidth' and 'addressdetails', then forwards the parameter
     * object to the place lookup.
     *
     * @param object      $oParams            Parameter accessor providing
     *                                        getBool/getInt/getFloat/getString/getStringList.
     * @param string|null $sForceGeometryType Passed through to the place lookup.
     *
     * @return void
     */
    public function loadParamArray($oParams, $sForceGeometryType = null)
    {
        $this->bBoundedSearch = $oParams->getBool('bounded', $this->bBoundedSearch);

        $this->setLimit($oParams->getInt('limit', $this->iFinalLimit));
        $this->iOffset = $oParams->getInt('offset', $this->iOffset);

        $this->bFallback = $oParams->getBool('fallback', $this->bFallback);

        // List of excluded Place IDs - used for more accurate paging
        $sExcluded = $oParams->getStringList('exclude_place_ids');
        if ($sExcluded) {
            foreach ($sExcluded as $iExcludedPlaceID) {
                $iExcludedPlaceID = (int)$iExcludedPlaceID;
                if ($iExcludedPlaceID) {
                    $aExcludePlaceIDs[$iExcludedPlaceID] = $iExcludedPlaceID;
                }
            }

            // Only replace the current list when at least one valid ID was given.
            if (isset($aExcludePlaceIDs)) {
                $this->aExcludePlaceIDs = $aExcludePlaceIDs;
            }
        }

        // Only certain ranks of feature
        $sFeatureType = $oParams->getString('featureType');
        if (!$sFeatureType) {
            $sFeatureType = $oParams->getString('featuretype');
        }
        if ($sFeatureType) {
            $this->setFeatureType($sFeatureType);
        }

        // Country code list: keep two-letter codes only, lower-cased
        $sCountries = $oParams->getStringList('countrycodes');
        if ($sCountries) {
            foreach ($sCountries as $sCountryCode) {
                if (preg_match('/^[a-zA-Z][a-zA-Z]$/', $sCountryCode)) {
                    $aCountries[] = strtolower($sCountryCode);
                }
            }
            if (isset($aCountries)) {
                $this->aCountryCodes = $aCountries;
            }
        }

        // 'viewboxlbrt' takes precedence over 'viewbox', which in turn takes
        // precedence over a route.
        $aViewbox = $oParams->getStringList('viewboxlbrt');
        if ($aViewbox) {
            if (count($aViewbox) != 4) {
                userError("Bad parameter 'viewboxlbrt'. Expected 4 coordinates.");
            }
            $this->setViewbox($aViewbox);
        } else {
            $aViewbox = $oParams->getStringList('viewbox');
            if ($aViewbox) {
                if (count($aViewbox) != 4) {
                    userError("Bad parameter 'viewbox'. Expected 4 coordinates.");
                }
                $this->setViewbox($aViewbox);
            } else {
                $aRoute = $oParams->getStringList('route');
                $fRouteWidth = $oParams->getFloat('routewidth');
                if ($aRoute && $fRouteWidth) {
                    $this->aRoutePoints = $aRoute;
                    $this->aRouteWidth = $fRouteWidth;
                }
            }
        }

        $this->oPlaceLookup->loadParamArray($oParams, $sForceGeometryType);
        $this->oPlaceLookup->setIncludeAddressDetails($oParams->getBool('addressdetails', false));
    }

    /**
     * Set the query from request parameters.
     *
     * Uses the free-form parameter 'q' when it is non-empty, otherwise the
     * structured parameters 'amenity', 'street', 'city', 'county', 'state',
     * 'country' and 'postalcode'.
     *
     * @param object $oParams Parameter accessor providing getString().
     *
     * @return void
     */
    public function setQueryFromParams($oParams)
    {
        // Search query
        $sQuery = $oParams->getString('q');
        if (!$sQuery) {
            $this->setStructuredQuery(
                $oParams->getString('amenity'),
                $oParams->getString('street'),
                $oParams->getString('city'),
                $oParams->getString('county'),
                $oParams->getString('state'),
                $oParams->getString('country'),
                $oParams->getString('postalcode')
            );
        } else {
            $this->setQuery($sQuery);
        }
    }

    /**
     * Add one element to the structured query.
     *
     * The rank range is only taken over while it still has its reset values
     * (0..30), i.e. the first non-empty element loaded determines it.
     *
     * @param string|false $sValue             Value of the element; ignored when empty after trimming.
     * @param string       $sKey               Key of the element in the structured query.
     * @param int          $iNewMinAddressRank Minimum address rank implied by the element.
     * @param int          $iNewMaxAddressRank Maximum address rank implied by the element.
     * @param array|false  $aItemListValues    Additional address ranks to accept, if any.
     *
     * @return bool True if the element was added, false if it was empty.
     */
    public function loadStructuredAddressElement($sValue, $sKey, $iNewMinAddressRank, $iNewMaxAddressRank, $aItemListValues)
    {
        $sValue = trim($sValue);
        if (!$sValue) {
            return false;
        }

        $this->aStructuredQuery[$sKey] = $sValue;
        if ($this->iMinAddressRank == 0 && $this->iMaxAddressRank == 30) {
            $this->iMinAddressRank = $iNewMinAddressRank;
            $this->iMaxAddressRank = $iNewMaxAddressRank;
        }
        if ($aItemListValues) {
            $this->aAddressRankList = array_merge($this->aAddressRankList, $aItemListValues);
        }

        return true;
    }

    /**
     * Set a structured query, replacing any previous query.
     *
     * Resets the rank range, the address rank list and the allowed types
     * and then loads all non-empty elements. The query string becomes the
     * comma-separated list of the loaded elements. When the resulting
     * maximum address rank is below 30, results are restricted to the
     * classes 'place' and 'boundary'.
     *
     * @param string|false $sAmenity    Amenity element.
     * @param string|false $sStreet     Street element.
     * @param string|false $sCity       City element.
     * @param string|false $sCounty     County element.
     * @param string|false $sState      State element.
     * @param string|false $sCountry    Country element.
     * @param string|false $sPostalCode Postal code element.
     *
     * @return void
     */
    public function setStructuredQuery($sAmenity = false, $sStreet = false, $sCity = false, $sCounty = false, $sState = false, $sCountry = false, $sPostalCode = false)
    {
        $this->sQuery = false;

        // Reset
        $this->iMinAddressRank = 0;
        $this->iMaxAddressRank = 30;
        $this->aAddressRankList = array();

        $this->aStructuredQuery = array();
        $this->sAllowedTypesSQLList = false;

        // Order matters: the first non-empty element sets the rank range and
        // the insertion order defines the order of the phrases.
        $this->loadStructuredAddressElement($sAmenity, 'amenity', 26, 30, false);
        $this->loadStructuredAddressElement($sStreet, 'street', 26, 30, false);
        $this->loadStructuredAddressElement($sCity, 'city', 14, 24, false);
        $this->loadStructuredAddressElement($sCounty, 'county', 9, 13, false);
        $this->loadStructuredAddressElement($sState, 'state', 8, 8, false);
        $this->loadStructuredAddressElement($sPostalCode, 'postalcode', 5, 11, array(5, 11));
        $this->loadStructuredAddressElement($sCountry, 'country', 4, 4, false);

        if (!empty($this->aStructuredQuery)) {
            $this->sQuery = join(', ', $this->aStructuredQuery);
            if ($this->iMaxAddressRank < 30) {
                $this->sAllowedTypesSQLList = '(\'place\',\'boundary\')';
            }
        }
    }

    /**
     * Relax the structured query by dropping one element.
     *
     * Removes the first element present out of 'postalcode', 'street',
     * 'city', 'county', 'state' and sets the remaining elements as the new
     * structured query.
     *
     * @return bool True if an element was dropped, false if there is no
     *              structured query, it has a single element only or none
     *              of the droppable elements is present.
     */
    public function fallbackStructuredQuery()
    {
        $aParams = $this->aStructuredQuery;

        if (!$aParams || count($aParams) == 1) {
            return false;
        }

        $aOrderToFallback = array('postalcode', 'street', 'city', 'county', 'state');

        foreach ($aOrderToFallback as $sType) {
            if (isset($aParams[$sType])) {
                unset($aParams[$sType]);
                // Missing elements are passed as false (the parameter default)
                // rather than null, so that no error suppression is needed
                // and trim() never receives null.
                $this->setStructuredQuery(
                    $aParams['amenity'] ?? false,
                    $aParams['street'] ?? false,
                    $aParams['city'] ?? false,
                    $aParams['county'] ?? false,
                    $aParams['state'] ?? false,
                    $aParams['country'] ?? false,
                    $aParams['postalcode'] ?? false
                );
                return true;
            }
        }

        return false;
    }

    /**
     * Extend the given base searches with the tokens of all phrases.
     *
     * Calculates all searches using oValidTokens, i.e.
     *
     *   'Wodsworth Road, Sheffield' =>
     *
     *   Phrase Wordset
     *   0      0       (wodsworth road)
     *   0      1       (wodsworth)(road)
     *   1      0       (sheffield)
     *
     * Searches are scored through their rank so that they can be ordered.
     * After every token, every word set and every phrase the candidate list
     * is sorted by search rank and cut down to about 50 entries.
     *
     * @param array  $aSearches    Base searches to extend.
     * @param array  $aPhrases     Phrases of the query; each must provide
     *                             getPhraseType() and getWordSets().
     * @param object $oValidTokens Token list providing get($sToken).
     *
     * @return array Valid searches grouped by rank, ordered by ascending rank.
     */
    public function getGroupedSearches($aSearches, $aPhrases, $oValidTokens)
    {
        foreach ($aPhrases as $iPhrase => $oPhrase) {
            $aNewPhraseSearches = array();
            $oPosition = new SearchPosition(
                $oPhrase->getPhraseType(),
                $iPhrase,
                count($aPhrases)
            );

            foreach ($oPhrase->getWordSets() as $aWordset) {
                $aWordsetSearches = $aSearches;

                // Add all words from this wordset
                foreach ($aWordset as $iToken => $sToken) {
                    $aNewWordsetSearches = array();
                    $oPosition->setTokenPosition($iToken, count($aWordset));

                    foreach ($aWordsetSearches as $oCurrentSearch) {
                        foreach ($oValidTokens->get($sToken) as $oSearchTerm) {
                            if ($oSearchTerm->isExtendable($oCurrentSearch, $oPosition)) {
                                $aNewSearches = $oSearchTerm->extendSearch(
                                    $oCurrentSearch,
                                    $oPosition
                                );

                                foreach ($aNewSearches as $oSearch) {
                                    if ($oSearch->getRank() < $this->iMaxRank) {
                                        $aNewWordsetSearches[] = $oSearch;
                                    }
                                }
                            }
                        }
                    }
                    // Sort and cut
                    usort($aNewWordsetSearches, array('Nominatim\SearchDescription', 'bySearchRank'));
                    $aWordsetSearches = array_slice($aNewWordsetSearches, 0, 50);
                }

                // NOTE(review): $aNewWordsetSearches is only assigned inside the
                // token loop above, so this relies on word sets never being
                // empty - confirm against Phrase::getWordSets().
                $aNewPhraseSearches = array_merge($aNewPhraseSearches, $aNewWordsetSearches);
                usort($aNewPhraseSearches, array('Nominatim\SearchDescription', 'bySearchRank'));

                // Drop searches that are identical to a better ranked one.
                $aSearchHash = array();
                foreach ($aNewPhraseSearches as $iSearch => $aSearch) {
                    $sHash = serialize($aSearch);
                    if (isset($aSearchHash[$sHash])) {
                        unset($aNewPhraseSearches[$iSearch]);
                    } else {
                        $aSearchHash[$sHash] = 1;
                    }
                }

                $aNewPhraseSearches = array_slice($aNewPhraseSearches, 0, 50);
            }

            // Re-group the searches by their score, drop anything that does
            // not rank below $this->iMaxRank as just not worth trying
            $aGroupedSearches = array();
            foreach ($aNewPhraseSearches as $aSearch) {
                $iRank = $aSearch->getRank();
                if ($iRank < $this->iMaxRank) {
                    if (!isset($aGroupedSearches[$iRank])) {
                        $aGroupedSearches[$iRank] = array();
                    }
                    $aGroupedSearches[$iRank][] = $aSearch;
                }
            }
            ksort($aGroupedSearches);

            // Carry whole rank groups over to the next phrase until more
            // than 50 searches have been collected.
            $iSearchCount = 0;
            $aSearches = array();
            foreach ($aGroupedSearches as $aNewSearches) {
                $iSearchCount += count($aNewSearches);
                $aSearches = array_merge($aSearches, $aNewSearches);
                if ($iSearchCount > 50) {
                    break;
                }
            }
        }

        // Revisit searches, drop bad searches and give penalty to unlikely combinations.
        $aGroupedSearches = array();
        foreach ($aSearches as $oSearch) {
            if (!$oSearch->isValidSearch()) {
                continue;
            }

            $iRank = $oSearch->getRank();
            if (!isset($aGroupedSearches[$iRank])) {
                $aGroupedSearches[$iRank] = array();
            }
            $aGroupedSearches[$iRank][] = $oSearch;
        }
        ksort($aGroupedSearches);

        return $aGroupedSearches;
    }

    /* Perform the actual query lookup.

        Returns an ordered list of results, each with the following fields:
            osm_type: type of corresponding OSM object
                        N - node
                        W - way
                        R - relation
                        P - postcode (internally computed)
            osm_id: id of corresponding OSM object
            class: general object class (corresponds to tag key of primary OSM tag)
            type: subclass of object (corresponds to tag value of primary OSM tag)
            admin_level: see https://wiki.openstreetmap.org/wiki/Admin_level
            rank_search: rank in search hierarchy
                        (see also https://wiki.openstreetmap.org/wiki/Nominatim/Development_overview#Country_to_street_level)
            rank_address: rank in address hierarchy (determines order in address)
            place_id: internal key (may differ between different instances)
            country_code: ISO country code
            langaddress: localized full address
            placename: localized name of object
            ref: content of ref tag (if available)
            lon: longitude
            lat: latitude
            importance: importance of place based on Wikipedia link count
            addressimportance: cumulated importance of address elements
            extra_place: type of place (for admin boundaries, if there is a place tag)
            aBoundingBox: bounding Box
            label: short description of the object class/type (English only)
            name: full name (currently the same as langaddress)
            foundorder: secondary ordering for places with same importance

        Side effects visible in this method: the 'amenity' element is removed
        from the structured query when it is used as special term, the place
        ids of all inspected results are added to the exclude list, and with
        fallback enabled the structured query is relaxed and the lookup
        repeated when nothing was found.
    */
    public function lookup()
    {
        Debug::newFunction('Geocode::lookup');
        if (!$this->sQuery && !$this->aStructuredQuery) {
            return array();
        }

        Debug::printDebugArray('Geocode', $this);

        $oCtx = new SearchContext();

        if ($this->aRoutePoints) {
            $oCtx->setViewboxFromRoute(
                $this->oDB,
                $this->aRoutePoints,
                $this->aRouteWidth,
                $this->bBoundedSearch
            );
        } elseif ($this->aViewBox) {
            $oCtx->setViewboxFromBox($this->aViewBox, $this->bBoundedSearch);
        }
        if ($this->aExcludePlaceIDs) {
            $oCtx->setExcludeList($this->aExcludePlaceIDs);
        }
        if ($this->aCountryCodes) {
            $oCtx->setCountryList($this->aCountryCodes);
        }

        Debug::newSection('Query Preprocessing');

        $sQuery = $this->sQuery;
        // An empty pattern with the u modifier only succeeds on valid UTF-8.
        if (!preg_match('//u', $sQuery)) {
            userError('Query string is not UTF-8 encoded.');
        }

        // Conflicts between US state abbreviations and various words for 'the' in different languages
        if (isset($this->aLangPrefOrder['name:en'])) {
            $sQuery = preg_replace('/(^|,)\s*il\s*(,|$)/i', '\1illinois\2', $sQuery);
            $sQuery = preg_replace('/(^|,)\s*al\s*(,|$)/i', '\1alabama\2', $sQuery);
            $sQuery = preg_replace('/(^|,)\s*la\s*(,|$)/i', '\1louisiana\2', $sQuery);
        }

        // Do we have anything that looks like a lat/lon pair?
        $sQuery = $oCtx->setNearPointFromQuery($sQuery);

        if ($sQuery || $this->aStructuredQuery) {
            // Start with a single blank search
            $aSearches = array(new SearchDescription($oCtx));

            if ($sQuery) {
                $sQuery = $aSearches[0]->extractKeyValuePairs($sQuery);
            }

            // Special terms are given in square brackets; all of them are
            // removed from the query but only the first one is used.
            $sSpecialTerm = '';
            if ($sQuery) {
                preg_match_all(
                    '/\\[([\\w ]*)\\]/u',
                    $sQuery,
                    $aSpecialTermsRaw,
                    PREG_SET_ORDER
                );
                if (!empty($aSpecialTermsRaw)) {
                    Debug::printVar('Special terms', $aSpecialTermsRaw);
                }

                foreach ($aSpecialTermsRaw as $aSpecialTerm) {
                    $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery);
                    if (!$sSpecialTerm) {
                        $sSpecialTerm = $aSpecialTerm[1];
                    }
                }
            }
            if (!$sSpecialTerm && $this->aStructuredQuery
                && isset($this->aStructuredQuery['amenity'])) {
                $sSpecialTerm = $this->aStructuredQuery['amenity'];
                unset($this->aStructuredQuery['amenity']);
            }

            if ($sSpecialTerm && !$aSearches[0]->hasOperator()) {
                $aTokens = $this->oTokenizer->tokensForSpecialTerm($sSpecialTerm);

                if (!empty($aTokens)) {
                    $aNewSearches = array();
                    $oPosition = new SearchPosition('', 0, 1);
                    $oPosition->setTokenPosition(0, 1);

                    foreach ($aSearches as $oSearch) {
                        foreach ($aTokens as $oToken) {
                            $aNewSearches = array_merge(
                                $aNewSearches,
                                $oToken->extendSearch($oSearch, $oPosition)
                            );
                        }
                    }
                    $aSearches = $aNewSearches;
                }
            }

            // Split query into phrases
            // Commas are used to reduce the search space by indicating where phrases split
            $aPhrases = array();
            if ($this->aStructuredQuery) {
                foreach ($this->aStructuredQuery as $iPhrase => $sPhrase) {
                    $aPhrases[] = new Phrase($sPhrase, $iPhrase);
                }
            } else {
                foreach (explode(',', $sQuery) as $sPhrase) {
                    $aPhrases[] = new Phrase($sPhrase, '');
                }
            }

            Debug::printDebugArray('Search context', $oCtx);
            Debug::printDebugArray('Base search', empty($aSearches) ? null : $aSearches[0]);

            Debug::newSection('Tokenization');
            $oValidTokens = $this->oTokenizer->extractTokensFromPhrases($aPhrases);

            if ($oValidTokens->count() > 0) {
                $oCtx->setFullNameWords($oValidTokens->getFullWordIDs());

                $aPhrases = array_filter($aPhrases, function ($oPhrase) {
                    return $oPhrase->getWordSets() !== null;
                });

                // Any words that have failed completely?
                // TODO: suggestions

                Debug::printGroupTable('Valid Tokens', $oValidTokens->debugInfo());
                Debug::printDebugTable('Phrases', $aPhrases);

                Debug::newSection('Search candidates');

                $aGroupedSearches = $this->getGroupedSearches($aSearches, $aPhrases, $oValidTokens);

                // The reverse pass accesses the first phrase directly, so it
                // must be skipped when the filter above removed all phrases.
                if (!$this->aStructuredQuery && !empty($aPhrases)) {
                    // Reverse phrase array and also reverse the order of the wordsets in
                    // the first and final phrase. Don't bother about phrases in the middle
                    // because order in the address doesn't matter.
                    $aPhrases = array_reverse($aPhrases);
                    $aPhrases[0]->invertWordSets();
                    if (count($aPhrases) > 1) {
                        $aPhrases[count($aPhrases)-1]->invertWordSets();
                    }
                    $aReverseGroupedSearches = $this->getGroupedSearches($aSearches, $aPhrases, $oValidTokens);

                    // Merge the forward searches into the reverse ones.
                    foreach ($aGroupedSearches as $aSearches) {
                        foreach ($aSearches as $aSearch) {
                            if (!isset($aReverseGroupedSearches[$aSearch->getRank()])) {
                                $aReverseGroupedSearches[$aSearch->getRank()] = array();
                            }
                            $aReverseGroupedSearches[$aSearch->getRank()][] = $aSearch;
                        }
                    }

                    $aGroupedSearches = $aReverseGroupedSearches;
                    ksort($aGroupedSearches);
                }
            } else {
                // Re-group the searches by their score, drop anything that does
                // not rank below $this->iMaxRank as just not worth trying
                $aGroupedSearches = array();
                foreach ($aSearches as $aSearch) {
                    if ($aSearch->getRank() < $this->iMaxRank) {
                        if (!isset($aGroupedSearches[$aSearch->getRank()])) {
                            $aGroupedSearches[$aSearch->getRank()] = array();
                        }
                        $aGroupedSearches[$aSearch->getRank()][] = $aSearch;
                    }
                }
                ksort($aGroupedSearches);
            }

            // Filter out duplicate searches
            $aSearchHash = array();
            foreach ($aGroupedSearches as $iGroup => $aSearches) {
                foreach ($aSearches as $iSearch => $aSearch) {
                    $sHash = serialize($aSearch);
                    if (isset($aSearchHash[$sHash])) {
                        unset($aGroupedSearches[$iGroup][$iSearch]);
                        if (empty($aGroupedSearches[$iGroup])) {
                            unset($aGroupedSearches[$iGroup]);
                        }
                    } else {
                        $aSearchHash[$sHash] = 1;
                    }
                }
            }

            Debug::printGroupedSearch(
                $aGroupedSearches,
                $oValidTokens->debugTokenByWordIdList()
            );

            // Start the search process
            $iGroupLoop = 0;
            $iQueryLoop = 0;
            $aNextResults = array();
            foreach ($aGroupedSearches as $iGroupedRank => $aSearches) {
                $iGroupLoop++;
                // Continue with the results carried over from the previous group.
                $aResults = $aNextResults;
                foreach ($aSearches as $oSearch) {
                    $iQueryLoop++;

                    Debug::newSection("Search Loop, group $iGroupLoop, loop $iQueryLoop");
                    Debug::printGroupedSearch(
                        array($iGroupedRank => array($oSearch)),
                        $oValidTokens->debugTokenByWordIdList()
                    );

                    $aNewResults = $oSearch->query(
                        $this->oDB,
                        $this->iMinAddressRank,
                        $this->iMaxAddressRank,
                        $this->iLimit
                    );

                    // The same result may appear in different rounds, only
                    // use the one with minimal rank.
                    foreach ($aNewResults as $iPlace => $oRes) {
                        if (!isset($aResults[$iPlace])
                            || $aResults[$iPlace]->iResultRank > $oRes->iResultRank) {
                            $aResults[$iPlace] = $oRes;
                        }
                    }

                    if ($iQueryLoop > 20) {
                        break;
                    }
                }

                if (!empty($aResults)) {
                    $aSplitResults = Result::splitResults($aResults);
                    Debug::printVar('Split results', $aSplitResults);
                    if ($iGroupLoop <= 4
                        && reset($aSplitResults['head'])->iResultRank > 0
                        && $iGroupedRank !== array_key_last($aGroupedSearches)) {
                        // Haven't found an exact match for the query yet.
                        // Therefore add result from the next group level.
                        $aNextResults = $aSplitResults['head'];
                        foreach ($aNextResults as $oRes) {
                            $oRes->iResultRank--;
                        }
                        foreach ($aSplitResults['tail'] as $oRes) {
                            $oRes->iResultRank--;
                            $aNextResults[$oRes->iId] = $oRes;
                        }
                        $aResults = array();
                    } else {
                        $aResults = $aSplitResults['head'];
                    }
                }

                if (!empty($aResults) && ($this->iMinAddressRank != 0 || $this->iMaxAddressRank != 30)) {
                    // Need to verify passes rank limits before dropping out of the loop (yuk!)
                    // reduces the number of place ids, like a filter
                    // rank_address is 30 for interpolated housenumbers
                    $aFilterSql = array();
                    $sPlaceIds = Result::joinIdsByTable($aResults, Result::TABLE_PLACEX);
                    if ($sPlaceIds) {
                        $sSQL = 'SELECT place_id FROM placex ';
                        $sSQL .= 'WHERE place_id in ('.$sPlaceIds.') ';
                        $sSQL .= ' AND (';
                        $sSQL .= " placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
                        $sSQL .= " OR placex.rank_search between $this->iMinAddressRank and $this->iMaxAddressRank ";
                        if ($this->aAddressRankList) {
                            $sSQL .= ' OR placex.rank_address in ('.join(',', $this->aAddressRankList).')';
                        }
                        $sSQL .= ')';
                        $aFilterSql[] = $sSQL;
                    }
                    $sPlaceIds = Result::joinIdsByTable($aResults, Result::TABLE_POSTCODE);
                    if ($sPlaceIds) {
                        $sSQL = ' SELECT place_id FROM location_postcode lp ';
                        $sSQL .= 'WHERE place_id in ('.$sPlaceIds.') ';
                        $sSQL .= " AND (lp.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
                        if ($this->aAddressRankList) {
                            $sSQL .= ' OR lp.rank_address in ('.join(',', $this->aAddressRankList).')';
                        }
                        $sSQL .= ') ';
                        $aFilterSql[] = $sSQL;
                    }

                    $aFilteredIDs = array();
                    if ($aFilterSql) {
                        $sSQL = join(' UNION ', $aFilterSql);
                        Debug::printSQL($sSQL);
                        $aFilteredIDs = $this->oDB->getCol($sSQL);
                    }

                    // Keep results that passed the SQL filter. Results from the
                    // OSMLINE and TIGER tables are not covered by the queries
                    // above and are kept when the maximum rank is 30.
                    $tempIDs = array();
                    foreach ($aResults as $oResult) {
                        if (($this->iMaxAddressRank == 30
                             && ($oResult->iTable == Result::TABLE_OSMLINE
                                 || $oResult->iTable == Result::TABLE_TIGER))
                            || in_array($oResult->iId, $aFilteredIDs)
                        ) {
                            $tempIDs[$oResult->iId] = $oResult;
                        }
                    }
                    $aResults = $tempIDs;
                }

                if (!empty($aResults) || $iGroupLoop > 4 || $iQueryLoop > 30) {
                    break;
                }
            }
        } else {
            // Just interpret as a reverse geocode
            $oReverse = new ReverseGeocode($this->oDB);
            $oReverse->setZoom(18);

            $oLookup = $oReverse->lookupPoint($oCtx->sqlNear, false);

            Debug::printVar('Reverse search', $oLookup);

            if ($oLookup) {
                $aResults = array($oLookup->iId => $oLookup);
            }
        }

        // No results? Done
        if (empty($aResults)) {
            if ($this->bFallback && $this->fallbackStructuredQuery()) {
                return $this->lookup();
            }

            return array();
        }

        if ($this->aAddressRankList) {
            $this->oPlaceLookup->setAddressRankList($this->aAddressRankList);
        }
        $this->oPlaceLookup->setAllowedTypesSQLList($this->sAllowedTypesSQLList);
        $this->oPlaceLookup->setLanguagePreference($this->aLangPrefOrder);
        if ($oCtx->hasNearPoint()) {
            $this->oPlaceLookup->setAnchorSql($oCtx->sqlNear);
        }

        $aSearchResults = $this->oPlaceLookup->lookup($aResults);

        // Words of the query that are rechecked against the result address.
        // Only words containing a letter or digit are kept. The u modifier is
        // required so that the Unicode properties are matched against code
        // points instead of single bytes of the UTF-8 encoded words.
        $aRecheckWords = preg_split('/\b[\s,\\-]*/u', $sQuery);
        foreach ($aRecheckWords as $i => $sWord) {
            if (!preg_match('/[\pL\pN]/u', $sWord)) {
                unset($aRecheckWords[$i]);
            }
        }

        Debug::printVar('Recheck words', $aRecheckWords);

        foreach ($aSearchResults as $iIdx => $aResult) {
            $fRadius = ClassTypes\getDefRadius($aResult);

            $aOutlineResult = $this->oPlaceLookup->getOutlines($aResult['place_id'], $aResult['lon'], $aResult['lat'], $fRadius);
            if ($aOutlineResult) {
                $aResult = array_merge($aResult, $aOutlineResult);
            }

            // Is there an icon set for this type of result?
            $sIcon = ClassTypes\getIconFile($aResult);
            if (isset($sIcon)) {
                $aResult['icon'] = $sIcon;
            }

            $sLabel = ClassTypes\getLabel($aResult);
            if (isset($sLabel)) {
                $aResult['label'] = $sLabel;
            }
            $aResult['name'] = $aResult['langaddress'];

            if ($oCtx->hasNearPoint()) {
                $aResult['importance'] = 0.001;
                $aResult['foundorder'] = $aResult['addressimportance'];
            } else {
                $aResult['importance'] = max(0.001, $aResult['importance']);
                $aResult['importance'] *= $this->viewboxImportanceFactor(
                    $aResult['lon'],
                    $aResult['lat']
                );

                // secondary ordering for results with same importance (the smaller the better):
                // - approximate importance of address parts
                if (isset($aResult['addressimportance']) && $aResult['addressimportance']) {
                    $aResult['foundorder'] = -$aResult['addressimportance']/10;
                } else {
                    $aResult['foundorder'] = -$aResult['importance'];
                }
                // - number of exact matches from the query
                $aResult['foundorder'] -= $aResults[$aResult['place_id']]->iExactMatches;
                // - importance of the class/type
                $iClassImportance = ClassTypes\getImportance($aResult);
                if (isset($iClassImportance)) {
                    $aResult['foundorder'] += 0.0001 * $iClassImportance;
                } else {
                    $aResult['foundorder'] += 0.01;
                }
                // - rank
                $aResult['foundorder'] -= 0.00001 * (30 - $aResult['rank_search']);

                // Adjust importance for the number of exact string matches in the result
                $iCountWords = 0;
                $sAddress = $aResult['langaddress'];
                foreach ($aRecheckWords as $i => $sWord) {
                    if (stripos($sAddress, $sWord)!==false) {
                        $iCountWords++;
                        // Small bonus when the word makes up a complete address part.
                        if (preg_match('/(^|,)\s*'.preg_quote($sWord, '/').'\s*(,|$)/', $sAddress)) {
                            $iCountWords += 0.1;
                        }
                    }
                }

                // 0.1 is a completely arbitrary number but something in the range 0.1 to 0.5 would seem right
                $aResult['importance'] = $aResult['importance'] + ($iCountWords*0.1);
            }
            $aSearchResults[$iIdx] = $aResult;
        }
        uasort($aSearchResults, 'byImportance');
        Debug::printVar('Pre-filter results', $aSearchResults);

        $aOSMIDDone = array();
        $aClassTypeNameDone = array();
        $aToFilter = $aSearchResults;
        $aSearchResults = array();
        foreach ($aToFilter as $aResult) {
            // Every inspected result ends up in the exclude list, including
            // those dropped as duplicates.
            $this->aExcludePlaceIDs[$aResult['place_id']] = $aResult['place_id'];
            if (!$this->oPlaceLookup->doDeDupe() || (!isset($aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']])
                && !isset($aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']]))
            ) {
                $aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']] = true;
                $aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']] = true;
                $aSearchResults[] = $aResult;
            }

            // Absolute limit on number of results
            if (count($aSearchResults) >= $this->iFinalLimit) {
                break;
            }
        }

        Debug::printVar('Post-filter results', $aSearchResults);
        return $aSearchResults;
    } // end lookup()

    /**
     * Return the current search settings for debug output.
     *
     * @return array Map of human-readable label to setting value.
     */
    public function debugInfo()
    {
        return array(
                'Query' => $this->sQuery,
                'Structured query' => $this->aStructuredQuery,
                'Name keys' => Debug::fmtArrayVals($this->aLangPrefOrder),
                'Excluded place IDs' => Debug::fmtArrayVals($this->aExcludePlaceIDs),
                'Limit (for searches)' => $this->iLimit,
                'Limit (for results)'=> $this->iFinalLimit,
                'Country codes' => Debug::fmtArrayVals($this->aCountryCodes),
                'Bounded search' => $this->bBoundedSearch,
                'Viewbox' => Debug::fmtArrayVals($this->aViewBox),
                'Route points' => Debug::fmtArrayVals($this->aRoutePoints),
                'Route width' => $this->aRouteWidth,
                'Max rank' => $this->iMaxRank,
                'Min address rank' => $this->iMinAddressRank,
                'Max address rank' => $this->iMaxAddressRank,
                'Address rank list' => Debug::fmtArrayVals($this->aAddressRankList)
               );
    }
} // end class