]> git.openstreetmap.org Git - nominatim.git/blob - lib/Geocode.php
652434cca93ac23d767409418c2f020f0b81124b
[nominatim.git] / lib / Geocode.php
1 <?php
2
3 namespace Nominatim;
4
5 require_once(CONST_BasePath.'/lib/NearPoint.php');
6 require_once(CONST_BasePath.'/lib/PlaceLookup.php');
7 require_once(CONST_BasePath.'/lib/ReverseGeocode.php');
8
9 class Geocode
10 {
    // Database connection; assigned by reference in the constructor.
    protected $oDB;

    // Language preference list, quoted into an SQL ARRAY[] by getDetails().
    protected $aLangPrefOrder = array();

    // Output options loaded from 'addressdetails', 'extratags' and 'namedetails'.
    protected $bIncludeAddressDetails = false;
    protected $bIncludeExtraTags = false;
    protected $bIncludeNameDetails = false;

    // Polygon output options; echoed back as polygon* URL parameters.
    protected $bIncludePolygonAsPoints = false;
    protected $bIncludePolygonAsText = false;
    protected $bIncludePolygonAsGeoJSON = false;
    protected $bIncludePolygonAsKML = false;
    protected $bIncludePolygonAsSVG = false;
    protected $fPolygonSimplificationThreshold = 0.0;

    // Place IDs to exclude (keyed and valued by ID), from 'exclude_place_ids'.
    protected $aExcludePlaceIDs = array();
    // When false, getDetails() additionally groups placex rows by place_id.
    protected $bDeDupe = true;
    protected $bReverseInPlan = false;

    // setLimit() keeps iFinalLimit as the clamped request limit and
    // iLimit as iFinalLimit + min(iFinalLimit, 10).
    protected $iLimit = 20;
    protected $iFinalLimit = 10;
    protected $iOffset = 0;
    protected $bFallback = false;

    // false, or a list of lower-cased two-letter country codes.
    protected $aCountryCodes = false;

    protected $bBoundedSearch = false;
    // false, or four floats as stored by setViewbox().
    protected $aViewBox = false;
    // SQL geometry expressions built by setViewbox() / setRoute(); false when unset.
    protected $sViewboxCentreSQL = false;
    protected $sViewboxSmallSQL = false;
    protected $sViewboxLargeSQL = false;

    protected $iMaxRank = 20;
    // Address rank window applied to results in getDetails().
    protected $iMinAddressRank = 0;
    protected $iMaxAddressRank = 30;
    // Extra address ranks accepted in addition to the min/max window.
    protected $aAddressRankList = array();
    protected $exactMatchCache = array();

    // false, or an SQL list literal restricting placex.class in getDetails().
    protected $sAllowedTypesSQLList = false;

    // Free-text query; for structured queries the comma-joined elements.
    protected $sQuery = false;
    // false, or map of structured query element name => value.
    protected $aStructuredQuery = false;

    // Transliterator used by normTerm(); may be null, in which case terms pass through.
    protected $oNormalizer = null;
55
56
57     public function __construct(&$oDB)
58     {
59         $this->oDB =& $oDB;
60         $this->oNormalizer = \Transliterator::createFromRules(CONST_Term_Normalization_Rules);
61     }
62
63     private function normTerm($sTerm)
64     {
65         if ($this->oNormalizer === null) {
66             return $sTerm;
67         }
68
69         return $this->oNormalizer->transliterate($sTerm);
70     }
71
72     public function setReverseInPlan($bReverse)
73     {
74         $this->bReverseInPlan = $bReverse;
75     }
76
77     public function setLanguagePreference($aLangPref)
78     {
79         $this->aLangPrefOrder = $aLangPref;
80     }
81
82     public function getMoreUrlParams()
83     {
84         if ($this->aStructuredQuery) {
85             $aParams = $this->aStructuredQuery;
86         } else {
87             $aParams = array('q' => $this->sQuery);
88         }
89
90         if ($this->aExcludePlaceIDs) {
91             $aParams['exclude_place_ids'] = implode(',', $this->aExcludePlaceIDs);
92         }
93
94         if ($this->bIncludeAddressDetails) $aParams['addressdetails'] = '1';
95         if ($this->bIncludeExtraTags) $aParams['extratags'] = '1';
96         if ($this->bIncludeNameDetails) $aParams['namedetails'] = '1';
97
98         if ($this->bIncludePolygonAsPoints) $aParams['polygon'] = '1';
99         if ($this->bIncludePolygonAsText) $aParams['polygon_text'] = '1';
100         if ($this->bIncludePolygonAsGeoJSON) $aParams['polygon_geojson'] = '1';
101         if ($this->bIncludePolygonAsKML) $aParams['polygon_kml'] = '1';
102         if ($this->bIncludePolygonAsSVG) $aParams['polygon_svg'] = '1';
103
104         if ($this->fPolygonSimplificationThreshold > 0.0) {
105             $aParams['polygon_threshold'] = $this->fPolygonSimplificationThreshold;
106         }
107
108         if ($this->bBoundedSearch) $aParams['bounded'] = '1';
109         if (!$this->bDeDupe) $aParams['dedupe'] = '0';
110
111         if ($this->aCountryCodes) {
112             $aParams['countrycodes'] = implode(',', $this->aCountryCodes);
113         }
114
115         if ($this->aViewBox) {
116             $aParams['viewbox'] = $this->aViewBox[0].','.$this->aViewBox[3]
117                                   .','.$this->aViewBox[2].','.$this->aViewBox[1];
118         }
119
120         return $aParams;
121     }
122
123     public function setIncludePolygonAsPoints($b = true)
124     {
125         $this->bIncludePolygonAsPoints = $b;
126     }
127
128     public function setIncludePolygonAsText($b = true)
129     {
130         $this->bIncludePolygonAsText = $b;
131     }
132
133     public function setIncludePolygonAsGeoJSON($b = true)
134     {
135         $this->bIncludePolygonAsGeoJSON = $b;
136     }
137
138     public function setIncludePolygonAsKML($b = true)
139     {
140         $this->bIncludePolygonAsKML = $b;
141     }
142
143     public function setIncludePolygonAsSVG($b = true)
144     {
145         $this->bIncludePolygonAsSVG = $b;
146     }
147
148     public function setPolygonSimplificationThreshold($f)
149     {
150         $this->fPolygonSimplificationThreshold = $f;
151     }
152
153     public function setLimit($iLimit = 10)
154     {
155         if ($iLimit > 50) $iLimit = 50;
156         if ($iLimit < 1) $iLimit = 1;
157
158         $this->iFinalLimit = $iLimit;
159         $this->iLimit = $iLimit + min($iLimit, 10);
160     }
161
162     public function setFeatureType($sFeatureType)
163     {
164         switch ($sFeatureType) {
165             case 'country':
166                 $this->setRankRange(4, 4);
167                 break;
168             case 'state':
169                 $this->setRankRange(8, 8);
170                 break;
171             case 'city':
172                 $this->setRankRange(14, 16);
173                 break;
174             case 'settlement':
175                 $this->setRankRange(8, 20);
176                 break;
177         }
178     }
179
180     public function setRankRange($iMin, $iMax)
181     {
182         $this->iMinAddressRank = $iMin;
183         $this->iMaxAddressRank = $iMax;
184     }
185
186     public function setRoute($aRoutePoints, $fRouteWidth)
187     {
188         $this->aViewBox = false;
189
190         $this->sViewboxCentreSQL = "ST_SetSRID('LINESTRING(";
191         $sSep = '';
192         foreach ($aRoutePoints as $aPoint) {
193             $fPoint = (float)$aPoint;
194             $this->sViewboxCentreSQL .= $sSep.$fPoint;
195             $sSep = ($sSep == ' ') ? ',' : ' ';
196         }
197         $this->sViewboxCentreSQL .= ")'::geometry,4326)";
198
199         $this->sViewboxSmallSQL = 'ST_BUFFER('.$this->sViewboxCentreSQL;
200         $this->sViewboxSmallSQL .= ','.($fRouteWidth/69).')';
201
202         $this->sViewboxLargeSQL = 'ST_BUFFER('.$this->sViewboxCentreSQL;
203         $this->sViewboxLargeSQL .= ','.($fRouteWidth/30).')';
204     }
205
206     public function setViewbox($aViewbox)
207     {
208         $this->aViewBox = array_map('floatval', $aViewbox);
209
210         $this->aViewBox[0] = max(-180.0, min(180, $this->aViewBox[0]));
211         $this->aViewBox[1] = max(-90.0, min(90, $this->aViewBox[1]));
212         $this->aViewBox[2] = max(-180.0, min(180, $this->aViewBox[2]));
213         $this->aViewBox[3] = max(-90.0, min(90, $this->aViewBox[3]));
214
215         if (abs($this->aViewBox[0] - $this->aViewBox[2]) < 0.000000001
216             || abs($this->aViewBox[1] - $this->aViewBox[3]) < 0.000000001
217         ) {
218             userError("Bad parameter 'viewbox'. Not a box.");
219         }
220
221         $fHeight = $this->aViewBox[0] - $this->aViewBox[2];
222         $fWidth = $this->aViewBox[1] - $this->aViewBox[3];
223         $aBigViewBox[0] = $this->aViewBox[0] + $fHeight;
224         $aBigViewBox[2] = $this->aViewBox[2] - $fHeight;
225         $aBigViewBox[1] = $this->aViewBox[1] + $fWidth;
226         $aBigViewBox[3] = $this->aViewBox[3] - $fWidth;
227
228         $this->sViewboxCentreSQL = false;
229         $this->sViewboxSmallSQL = sprintf(
230             'ST_SetSRID(ST_MakeBox2D(ST_Point(%F,%F),ST_Point(%F,%F)),4326)',
231             $this->aViewBox[0],
232             $this->aViewBox[1],
233             $this->aViewBox[2],
234             $this->aViewBox[3]
235         );
236         $this->sViewboxLargeSQL = sprintf(
237             'ST_SetSRID(ST_MakeBox2D(ST_Point(%F,%F),ST_Point(%F,%F)),4326)',
238             $aBigViewBox[0],
239             $aBigViewBox[1],
240             $aBigViewBox[2],
241             $aBigViewBox[3]
242         );
243     }
244
245     public function setQuery($sQueryString)
246     {
247         $this->sQuery = $sQueryString;
248         $this->aStructuredQuery = false;
249     }
250
251     public function getQueryString()
252     {
253         return $this->sQuery;
254     }
255
256
257     public function loadParamArray($oParams)
258     {
259         $this->bIncludeAddressDetails
260          = $oParams->getBool('addressdetails', $this->bIncludeAddressDetails);
261         $this->bIncludeExtraTags
262          = $oParams->getBool('extratags', $this->bIncludeExtraTags);
263         $this->bIncludeNameDetails
264          = $oParams->getBool('namedetails', $this->bIncludeNameDetails);
265
266         $this->bBoundedSearch = $oParams->getBool('bounded', $this->bBoundedSearch);
267         $this->bDeDupe = $oParams->getBool('dedupe', $this->bDeDupe);
268
269         $this->setLimit($oParams->getInt('limit', $this->iFinalLimit));
270         $this->iOffset = $oParams->getInt('offset', $this->iOffset);
271
272         $this->bFallback = $oParams->getBool('fallback', $this->bFallback);
273
274         // List of excluded Place IDs - used for more acurate pageing
275         $sExcluded = $oParams->getStringList('exclude_place_ids');
276         if ($sExcluded) {
277             foreach ($sExcluded as $iExcludedPlaceID) {
278                 $iExcludedPlaceID = (int)$iExcludedPlaceID;
279                 if ($iExcludedPlaceID)
280                     $aExcludePlaceIDs[$iExcludedPlaceID] = $iExcludedPlaceID;
281             }
282
283             if (isset($aExcludePlaceIDs))
284                 $this->aExcludePlaceIDs = $aExcludePlaceIDs;
285         }
286
287         // Only certain ranks of feature
288         $sFeatureType = $oParams->getString('featureType');
289         if (!$sFeatureType) $sFeatureType = $oParams->getString('featuretype');
290         if ($sFeatureType) $this->setFeatureType($sFeatureType);
291
292         // Country code list
293         $sCountries = $oParams->getStringList('countrycodes');
294         if ($sCountries) {
295             foreach ($sCountries as $sCountryCode) {
296                 if (preg_match('/^[a-zA-Z][a-zA-Z]$/', $sCountryCode)) {
297                     $aCountries[] = strtolower($sCountryCode);
298                 }
299             }
300             if (isset($aCountries))
301                 $this->aCountryCodes = $aCountries;
302         }
303
304         $aViewbox = $oParams->getStringList('viewboxlbrt');
305         if ($aViewbox) {
306             if (count($aViewbox) != 4) {
307                 userError("Bad parmater 'viewboxlbrt'. Expected 4 coordinates.");
308             }
309             $this->setViewbox($aViewbox);
310         } else {
311             $aViewbox = $oParams->getStringList('viewbox');
312             if ($aViewbox) {
313                 if (count($aViewbox) != 4) {
314                     userError("Bad parmater 'viewbox'. Expected 4 coordinates.");
315                 }
316                 $this->setViewBox($aViewbox);
317             } else {
318                 $aRoute = $oParams->getStringList('route');
319                 $fRouteWidth = $oParams->getFloat('routewidth');
320                 if ($aRoute && $fRouteWidth) {
321                     $this->setRoute($aRoute, $fRouteWidth);
322                 }
323             }
324         }
325     }
326
327     public function setQueryFromParams($oParams)
328     {
329         // Search query
330         $sQuery = $oParams->getString('q');
331         if (!$sQuery) {
332             $this->setStructuredQuery(
333                 $oParams->getString('amenity'),
334                 $oParams->getString('street'),
335                 $oParams->getString('city'),
336                 $oParams->getString('county'),
337                 $oParams->getString('state'),
338                 $oParams->getString('country'),
339                 $oParams->getString('postalcode')
340             );
341             $this->setReverseInPlan(false);
342         } else {
343             $this->setQuery($sQuery);
344         }
345     }
346
347     public function loadStructuredAddressElement($sValue, $sKey, $iNewMinAddressRank, $iNewMaxAddressRank, $aItemListValues)
348     {
349         $sValue = trim($sValue);
350         if (!$sValue) return false;
351         $this->aStructuredQuery[$sKey] = $sValue;
352         if ($this->iMinAddressRank == 0 && $this->iMaxAddressRank == 30) {
353             $this->iMinAddressRank = $iNewMinAddressRank;
354             $this->iMaxAddressRank = $iNewMaxAddressRank;
355         }
356         if ($aItemListValues) $this->aAddressRankList = array_merge($this->aAddressRankList, $aItemListValues);
357         return true;
358     }
359
360     public function setStructuredQuery($sAmenity = false, $sStreet = false, $sCity = false, $sCounty = false, $sState = false, $sCountry = false, $sPostalCode = false)
361     {
362         $this->sQuery = false;
363
364         // Reset
365         $this->iMinAddressRank = 0;
366         $this->iMaxAddressRank = 30;
367         $this->aAddressRankList = array();
368
369         $this->aStructuredQuery = array();
370         $this->sAllowedTypesSQLList = False;
371
372         $this->loadStructuredAddressElement($sAmenity, 'amenity', 26, 30, false);
373         $this->loadStructuredAddressElement($sStreet, 'street', 26, 30, false);
374         $this->loadStructuredAddressElement($sCity, 'city', 14, 24, false);
375         $this->loadStructuredAddressElement($sCounty, 'county', 9, 13, false);
376         $this->loadStructuredAddressElement($sState, 'state', 8, 8, false);
377         $this->loadStructuredAddressElement($sPostalCode, 'postalcode', 5, 11, array(5, 11));
378         $this->loadStructuredAddressElement($sCountry, 'country', 4, 4, false);
379
380         if (sizeof($this->aStructuredQuery) > 0) {
381             $this->sQuery = join(', ', $this->aStructuredQuery);
382             if ($this->iMaxAddressRank < 30) {
383                 $this->sAllowedTypesSQLList = '(\'place\',\'boundary\')';
384             }
385         }
386     }
387
388     public function fallbackStructuredQuery()
389     {
390         if (!$this->aStructuredQuery) return false;
391
392         $aParams = $this->aStructuredQuery;
393
394         if (sizeof($aParams) == 1) return false;
395
396         $aOrderToFallback = array('postalcode', 'street', 'city', 'county', 'state');
397
398         foreach ($aOrderToFallback as $sType) {
399             if (isset($aParams[$sType])) {
400                 unset($aParams[$sType]);
401                 $this->setStructuredQuery(@$aParams['amenity'], @$aParams['street'], @$aParams['city'], @$aParams['county'], @$aParams['state'], @$aParams['country'], @$aParams['postalcode']);
402                 return true;
403             }
404         }
405
406         return false;
407     }
408
409     public function getDetails($aPlaceIDs)
410     {
411         //$aPlaceIDs is an array with key: placeID and value: tiger-housenumber, if found, else -1
412         if (sizeof($aPlaceIDs) == 0) return array();
413
414         $sLanguagePrefArraySQL = "ARRAY[".join(',', array_map("getDBQuoted", $this->aLangPrefOrder))."]";
415
416         // Get the details for display (is this a redundant extra step?)
417         $sPlaceIDs = join(',', array_keys($aPlaceIDs));
418
419         $sImportanceSQL = '';
420         $sImportanceSQLGeom = '';
421         if ($this->sViewboxSmallSQL) {
422             $sImportanceSQL .= " CASE WHEN ST_Contains($this->sViewboxSmallSQL, ST_Collect(centroid)) THEN 1 ELSE 0.75 END * ";
423             $sImportanceSQLGeom .= " CASE WHEN ST_Contains($this->sViewboxSmallSQL, geometry) THEN 1 ELSE 0.75 END * ";
424         }
425         if ($this->sViewboxLargeSQL) {
426             $sImportanceSQL .= " CASE WHEN ST_Contains($this->sViewboxLargeSQL, ST_Collect(centroid)) THEN 1 ELSE 0.75 END * ";
427             $sImportanceSQLGeom .= " CASE WHEN ST_Contains($this->sViewboxLargeSQL, geometry) THEN 1 ELSE 0.75 END * ";
428         }
429
430         $sSQL  = "SELECT ";
431         $sSQL .= "    osm_type,";
432         $sSQL .= "    osm_id,";
433         $sSQL .= "    class,";
434         $sSQL .= "    type,";
435         $sSQL .= "    admin_level,";
436         $sSQL .= "    rank_search,";
437         $sSQL .= "    rank_address,";
438         $sSQL .= "    min(place_id) AS place_id, ";
439         $sSQL .= "    min(parent_place_id) AS parent_place_id, ";
440         $sSQL .= "    country_code, ";
441         $sSQL .= "    get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) AS langaddress,";
442         $sSQL .= "    get_name_by_language(name, $sLanguagePrefArraySQL) AS placename,";
443         $sSQL .= "    get_name_by_language(name, ARRAY['ref']) AS ref,";
444         if ($this->bIncludeExtraTags) $sSQL .= "hstore_to_json(extratags)::text AS extra,";
445         if ($this->bIncludeNameDetails) $sSQL .= "hstore_to_json(name)::text AS names,";
446         $sSQL .= "    avg(ST_X(centroid)) AS lon, ";
447         $sSQL .= "    avg(ST_Y(centroid)) AS lat, ";
448         $sSQL .= "    ".$sImportanceSQL."COALESCE(importance,0.75-(rank_search::float/40)) AS importance, ";
449         $sSQL .= "    ( ";
450         $sSQL .= "       SELECT max(p.importance*(p.rank_address+2))";
451         $sSQL .= "       FROM ";
452         $sSQL .= "         place_addressline s, ";
453         $sSQL .= "         placex p";
454         $sSQL .= "       WHERE s.place_id = min(CASE WHEN placex.rank_search < 28 THEN placex.place_id ELSE placex.parent_place_id END)";
455         $sSQL .= "         AND p.place_id = s.address_place_id ";
456         $sSQL .= "         AND s.isaddress ";
457         $sSQL .= "         AND p.importance is not null ";
458         $sSQL .= "    ) AS addressimportance, ";
459         $sSQL .= "    (extratags->'place') AS extra_place ";
460         $sSQL .= " FROM placex";
461         $sSQL .= " WHERE place_id in ($sPlaceIDs) ";
462         $sSQL .= "   AND (";
463         $sSQL .= "            placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
464         if (14 >= $this->iMinAddressRank && 14 <= $this->iMaxAddressRank) {
465             $sSQL .= "        OR (extratags->'place') = 'city'";
466         }
467         if ($this->aAddressRankList) {
468             $sSQL .= "        OR placex.rank_address in (".join(',', $this->aAddressRankList).")";
469         }
470         $sSQL .= "       ) ";
471         if ($this->sAllowedTypesSQLList) {
472             $sSQL .= "AND placex.class in $this->sAllowedTypesSQLList ";
473         }
474         $sSQL .= "    AND linked_place_id is null ";
475         $sSQL .= " GROUP BY ";
476         $sSQL .= "     osm_type, ";
477         $sSQL .= "     osm_id, ";
478         $sSQL .= "     class, ";
479         $sSQL .= "     type, ";
480         $sSQL .= "     admin_level, ";
481         $sSQL .= "     rank_search, ";
482         $sSQL .= "     rank_address, ";
483         $sSQL .= "     country_code, ";
484         $sSQL .= "     importance, ";
485         if (!$this->bDeDupe) $sSQL .= "place_id,";
486         $sSQL .= "     langaddress, ";
487         $sSQL .= "     placename, ";
488         $sSQL .= "     ref, ";
489         if ($this->bIncludeExtraTags) $sSQL .= "extratags, ";
490         if ($this->bIncludeNameDetails) $sSQL .= "name, ";
491         $sSQL .= "     extratags->'place' ";
492
493         // postcode table
494         $sSQL .= "UNION ";
495         $sSQL .= "SELECT";
496         $sSQL .= "  'P' as osm_type,";
497         $sSQL .= "  (SELECT osm_id from placex p WHERE p.place_id = lp.parent_place_id) as osm_id,";
498         $sSQL .= "  'place' as class, 'postcode' as type,";
499         $sSQL .= "  null as admin_level, rank_search, rank_address,";
500         $sSQL .= "  place_id, parent_place_id, country_code,";
501         $sSQL .= "  get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) AS langaddress,";
502         $sSQL .= "  postcode as placename,";
503         $sSQL .= "  postcode as ref,";
504         if ($this->bIncludeExtraTags) $sSQL .= "null AS extra,";
505         if ($this->bIncludeNameDetails) $sSQL .= "null AS names,";
506         $sSQL .= "  ST_x(st_centroid(geometry)) AS lon, ST_y(st_centroid(geometry)) AS lat,";
507         $sSQL .=    $sImportanceSQLGeom."(0.75-(rank_search::float/40)) AS importance, ";
508         $sSQL .= "  (";
509         $sSQL .= "     SELECT max(p.importance*(p.rank_address+2))";
510         $sSQL .= "     FROM ";
511         $sSQL .= "       place_addressline s, ";
512         $sSQL .= "       placex p";
513         $sSQL .= "     WHERE s.place_id = lp.parent_place_id";
514         $sSQL .= "       AND p.place_id = s.address_place_id ";
515         $sSQL .= "       AND s.isaddress";
516         $sSQL .= "       AND p.importance is not null";
517         $sSQL .= "  ) AS addressimportance, ";
518         $sSQL .= "  null AS extra_place ";
519         $sSQL .= "FROM location_postcode lp";
520         $sSQL .= " WHERE place_id in ($sPlaceIDs) ";
521
522         if (30 >= $this->iMinAddressRank && 30 <= $this->iMaxAddressRank) {
523             // only Tiger housenumbers and interpolation lines need to be interpolated, because they are saved as lines
524             // with start- and endnumber, the common osm housenumbers are usually saved as points
525             $sHousenumbers = "";
526             $i = 0;
527             $length = count($aPlaceIDs);
528             foreach ($aPlaceIDs as $placeID => $housenumber) {
529                 $i++;
530                 $sHousenumbers .= "(".$placeID.", ".$housenumber.")";
531                 if ($i<$length) $sHousenumbers .= ", ";
532             }
533
534             if (CONST_Use_US_Tiger_Data) {
535                 // Tiger search only if a housenumber was searched and if it was found (i.e. aPlaceIDs[placeID] = housenumber != -1) (realized through a join)
536                 $sSQL .= " union";
537                 $sSQL .= " SELECT ";
538                 $sSQL .= "     'T' AS osm_type, ";
539                 $sSQL .= "     (SELECT osm_id from placex p WHERE p.place_id=min(blub.parent_place_id)) as osm_id, ";
540                 $sSQL .= "     'place' AS class, ";
541                 $sSQL .= "     'house' AS type, ";
542                 $sSQL .= "     null AS admin_level, ";
543                 $sSQL .= "     30 AS rank_search, ";
544                 $sSQL .= "     30 AS rank_address, ";
545                 $sSQL .= "     min(place_id) AS place_id, ";
546                 $sSQL .= "     min(parent_place_id) AS parent_place_id, ";
547                 $sSQL .= "     'us' AS country_code, ";
548                 $sSQL .= "     get_address_by_language(place_id, housenumber_for_place, $sLanguagePrefArraySQL) AS langaddress,";
549                 $sSQL .= "     null AS placename, ";
550                 $sSQL .= "     null AS ref, ";
551                 if ($this->bIncludeExtraTags) $sSQL .= "null AS extra,";
552                 if ($this->bIncludeNameDetails) $sSQL .= "null AS names,";
553                 $sSQL .= "     avg(st_x(centroid)) AS lon, ";
554                 $sSQL .= "     avg(st_y(centroid)) AS lat,";
555                 $sSQL .= "     ".$sImportanceSQL."-1.15 AS importance, ";
556                 $sSQL .= "     (";
557                 $sSQL .= "        SELECT max(p.importance*(p.rank_address+2))";
558                 $sSQL .= "        FROM ";
559                 $sSQL .= "          place_addressline s, ";
560                 $sSQL .= "          placex p";
561                 $sSQL .= "        WHERE s.place_id = min(blub.parent_place_id)";
562                 $sSQL .= "          AND p.place_id = s.address_place_id ";
563                 $sSQL .= "          AND s.isaddress";
564                 $sSQL .= "          AND p.importance is not null";
565                 $sSQL .= "     ) AS addressimportance, ";
566                 $sSQL .= "     null AS extra_place ";
567                 $sSQL .= " FROM (";
568                 $sSQL .= "     SELECT place_id, ";    // interpolate the Tiger housenumbers here
569                 $sSQL .= "         ST_LineInterpolatePoint(linegeo, (housenumber_for_place-startnumber::float)/(endnumber-startnumber)::float) AS centroid, ";
570                 $sSQL .= "         parent_place_id, ";
571                 $sSQL .= "         housenumber_for_place";
572                 $sSQL .= "     FROM (";
573                 $sSQL .= "            location_property_tiger ";
574                 $sSQL .= "            JOIN (values ".$sHousenumbers.") AS housenumbers(place_id, housenumber_for_place) USING(place_id)) ";
575                 $sSQL .= "     WHERE ";
576                 $sSQL .= "         housenumber_for_place>=0";
577                 $sSQL .= "         AND 30 between $this->iMinAddressRank AND $this->iMaxAddressRank";
578                 $sSQL .= " ) AS blub"; //postgres wants an alias here
579                 $sSQL .= " GROUP BY";
580                 $sSQL .= "      place_id, ";
581                 $sSQL .= "      housenumber_for_place"; //is this group by really needed?, place_id + housenumber (in combination) are unique
582                 if (!$this->bDeDupe) $sSQL .= ", place_id ";
583             }
584             // osmline
585             // interpolation line search only if a housenumber was searched and if it was found (i.e. aPlaceIDs[placeID] = housenumber != -1) (realized through a join)
586             $sSQL .= " UNION ";
587             $sSQL .= "SELECT ";
588             $sSQL .= "  'W' AS osm_type, ";
589             $sSQL .= "  osm_id, ";
590             $sSQL .= "  'place' AS class, ";
591             $sSQL .= "  'house' AS type, ";
592             $sSQL .= "  null AS admin_level, ";
593             $sSQL .= "  30 AS rank_search, ";
594             $sSQL .= "  30 AS rank_address, ";
595             $sSQL .= "  min(place_id) as place_id, ";
596             $sSQL .= "  min(parent_place_id) AS parent_place_id, ";
597             $sSQL .= "  country_code, ";
598             $sSQL .= "  get_address_by_language(place_id, housenumber_for_place, $sLanguagePrefArraySQL) AS langaddress, ";
599             $sSQL .= "  null AS placename, ";
600             $sSQL .= "  null AS ref, ";
601             if ($this->bIncludeExtraTags) $sSQL .= "null AS extra, ";
602             if ($this->bIncludeNameDetails) $sSQL .= "null AS names, ";
603             $sSQL .= "  AVG(st_x(centroid)) AS lon, ";
604             $sSQL .= "  AVG(st_y(centroid)) AS lat, ";
605             $sSQL .= "  ".$sImportanceSQL."-0.1 AS importance, ";  // slightly smaller than the importance for normal houses with rank 30, which is 0
606             $sSQL .= "  (";
607             $sSQL .= "     SELECT ";
608             $sSQL .= "       MAX(p.importance*(p.rank_address+2)) ";
609             $sSQL .= "     FROM";
610             $sSQL .= "       place_addressline s, ";
611             $sSQL .= "       placex p";
612             $sSQL .= "     WHERE s.place_id = min(blub.parent_place_id) ";
613             $sSQL .= "       AND p.place_id = s.address_place_id ";
614             $sSQL .= "       AND s.isaddress ";
615             $sSQL .= "       AND p.importance is not null";
616             $sSQL .= "  ) AS addressimportance,";
617             $sSQL .= "  null AS extra_place ";
618             $sSQL .= "  FROM (";
619             $sSQL .= "     SELECT ";
620             $sSQL .= "         osm_id, ";
621             $sSQL .= "         place_id, ";
622             $sSQL .= "         country_code, ";
623             $sSQL .= "         CASE ";             // interpolate the housenumbers here
624             $sSQL .= "           WHEN startnumber != endnumber ";
625             $sSQL .= "           THEN ST_LineInterpolatePoint(linegeo, (housenumber_for_place-startnumber::float)/(endnumber-startnumber)::float) ";
626             $sSQL .= "           ELSE ST_LineInterpolatePoint(linegeo, 0.5) ";
627             $sSQL .= "         END as centroid, ";
628             $sSQL .= "         parent_place_id, ";
629             $sSQL .= "         housenumber_for_place ";
630             $sSQL .= "     FROM (";
631             $sSQL .= "            location_property_osmline ";
632             $sSQL .= "            JOIN (values ".$sHousenumbers.") AS housenumbers(place_id, housenumber_for_place) USING(place_id)";
633             $sSQL .= "          ) ";
634             $sSQL .= "     WHERE housenumber_for_place>=0 ";
635             $sSQL .= "       AND 30 between $this->iMinAddressRank AND $this->iMaxAddressRank";
636             $sSQL .= "  ) as blub"; //postgres wants an alias here
637             $sSQL .= "  GROUP BY ";
638             $sSQL .= "    osm_id, ";
639             $sSQL .= "    place_id, ";
640             $sSQL .= "    housenumber_for_place, ";
641             $sSQL .= "    country_code "; //is this group by really needed?, place_id + housenumber (in combination) are unique
642             if (!$this->bDeDupe) $sSQL .= ", place_id ";
643
644             if (CONST_Use_Aux_Location_data) {
645                 $sSQL .= " UNION ";
646                 $sSQL .= "  SELECT ";
647                 $sSQL .= "     'L' AS osm_type, ";
648                 $sSQL .= "     place_id AS osm_id, ";
649                 $sSQL .= "     'place' AS class,";
650                 $sSQL .= "     'house' AS type, ";
651                 $sSQL .= "     null AS admin_level, ";
652                 $sSQL .= "     0 AS rank_search,";
653                 $sSQL .= "     0 AS rank_address, ";
654                 $sSQL .= "     min(place_id) AS place_id,";
655                 $sSQL .= "     min(parent_place_id) AS parent_place_id, ";
656                 $sSQL .= "     'us' AS country_code, ";
657                 $sSQL .= "     get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) AS langaddress, ";
658                 $sSQL .= "     null AS placename, ";
659                 $sSQL .= "     null AS ref, ";
660                 if ($this->bIncludeExtraTags) $sSQL .= "null AS extra, ";
661                 if ($this->bIncludeNameDetails) $sSQL .= "null AS names, ";
662                 $sSQL .= "     avg(ST_X(centroid)) AS lon, ";
663                 $sSQL .= "     avg(ST_Y(centroid)) AS lat, ";
664                 $sSQL .= "     ".$sImportanceSQL."-1.10 AS importance, ";
665                 $sSQL .= "     ( ";
666                 $sSQL .= "       SELECT max(p.importance*(p.rank_address+2))";
667                 $sSQL .= "       FROM ";
668                 $sSQL .= "          place_addressline s, ";
669                 $sSQL .= "          placex p";
670                 $sSQL .= "       WHERE s.place_id = min(location_property_aux.parent_place_id)";
671                 $sSQL .= "         AND p.place_id = s.address_place_id ";
672                 $sSQL .= "         AND s.isaddress";
673                 $sSQL .= "         AND p.importance is not null";
674                 $sSQL .= "     ) AS addressimportance, ";
675                 $sSQL .= "     null AS extra_place ";
676                 $sSQL .= "  FROM location_property_aux ";
677                 $sSQL .= "  WHERE place_id in ($sPlaceIDs) ";
678                 $sSQL .= "    AND 30 between $this->iMinAddressRank and $this->iMaxAddressRank ";
679                 $sSQL .= "  GROUP BY ";
680                 $sSQL .= "     place_id, ";
681                 if (!$this->bDeDupe) $sSQL .= "place_id, ";
682                 $sSQL .= "     get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) ";
683             }
684         }
685
686         $sSQL .= " order by importance desc";
687         if (CONST_Debug) {
688             echo "<hr>";
689             var_dump($sSQL);
690         }
691         $aSearchResults = chksql(
692             $this->oDB->getAll($sSQL),
693             "Could not get details for place."
694         );
695
696         return $aSearchResults;
697     }
698
699     public function getGroupedSearches($aSearches, $aPhraseTypes, $aPhrases, $aValidTokens, $aWordFrequencyScores, $bStructuredPhrases, $sNormQuery)
700     {
701         /*
702              Calculate all searches using aValidTokens i.e.
703              'Wodsworth Road, Sheffield' =>
704
705              Phrase Wordset
706              0      0       (wodsworth road)
707              0      1       (wodsworth)(road)
708              1      0       (sheffield)
709
710              Score how good the search is so they can be ordered

                 Parameters, as they are used below:
                   aSearches            list of search descriptions (arrays with
                                        iSearchRank, aName, aAddress, sOperator,
                                        sPostcode, sHouseNumber, ...) that each
                                        phrase is applied to in turn
                   aPhraseTypes         phrase type per phrase index; only read
                                        when bStructuredPhrases is set, and compared
                                        against 'country', 'postalcode' and 'street'
                   aPhrases             list of phrases, each with a 'wordsets'
                                        entry holding lists of token strings
                   aValidTokens         token string => list of search terms; the
                                        key with a leading space is tried first,
                                        the bare token is handled as partial match
                   aWordFrequencyScores word_id => score that is compared against
                                        CONST_Max_Word_Frequency
                   bStructuredPhrases   whether aPhraseTypes is to be applied
                   sNormQuery           normalised query used for substring checks;
                                        null switches the check off for
                                        class/type terms

                 Returns the surviving searches grouped by iSearchRank (used as
                 array key) and sorted by that key.
711          */
            // Penalty added to every search at the very end. It is raised when a
            // country term matches the first token of the first phrase.
712         $iGlobalRank = 0;
713
714         foreach ($aPhrases as $iPhrase => $aPhrase) {
715             $aNewPhraseSearches = array();
716             if ($bStructuredPhrases) $sPhraseType = $aPhraseTypes[$iPhrase];
717             else $sPhraseType = '';
718
719             foreach ($aPhrase['wordsets'] as $iWordSet => $aWordset) {
720                 // Too many permutations - too expensive
721                 if ($iWordSet > 120) break;
722
                    // Every wordset starts again from the searches that were
                    // left over after the previous phrase.
723                 $aWordsetSearches = $aSearches;
724
725                 // Add all words from this wordset
726                 foreach ($aWordset as $iToken => $sToken) {
727                     //echo "<br><b>$sToken</b>";
728                     $aNewWordsetSearches = array();
729
730                     foreach ($aWordsetSearches as $aCurrentSearch) {
731                         //echo "<i>";
732                         //var_dump($aCurrentSearch);
733                         //echo "</i>";
734
735                         // If the token is valid
736                         if (isset($aValidTokens[' '.$sToken])) {
737                             // TODO variable should go into aCurrentSearch
                                // Set once a postcode-as-primary search has been added for
                                // this search/token pair, so that only one is generated.
738                             $bHavePostcode = false;
739                             foreach ($aValidTokens[' '.$sToken] as $aSearchTerm) {
740                                 $aSearch = $aCurrentSearch;
                                    // Every term that is consumed costs one rank point.
741                                 $aSearch['iSearchRank']++;
742                                 if (($sPhraseType == '' || $sPhraseType == 'country') && !empty($aSearchTerm['country_code']) && $aSearchTerm['country_code'] != '0') {
                                        // Country term: only used when the search has no country yet.
743                                     if ($aSearch['sCountryCode'] === false) {
744                                         $aSearch['sCountryCode'] = strtolower($aSearchTerm['country_code']);
745                                         // Country is almost always at the end of the string - increase score for finding it anywhere else (optimisation)
746                                         if (($iToken+1 != sizeof($aWordset) || $iPhrase+1 != sizeof($aPhrases))) {
747                                             $aSearch['iSearchRank'] += 5;
748                                         }
749                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
750                                         // If it is at the beginning, we can be almost sure that this is the wrong order
751                                         // Increase score for all searches.
752                                         if ($iToken == 0 && $iPhrase == 0) {
753                                             $iGlobalRank++;
754                                         }
755                                     }
756                                 } elseif (($sPhraseType == '' || $sPhraseType == 'postalcode') && $aSearchTerm['class'] == 'place' && $aSearchTerm['type'] == 'postcode') {
757                                     // We need to try the case where the postal code is the primary element (i.e. no way to tell if it is (postalcode, city) OR (city, postalcode) so try both
                                        // The postcode is only accepted when the search has none yet and
                                        // its normalised word occurs in the normalised query.
758                                     if ($aSearch['sPostcode'] === '' &&
759                                         isset($aSearchTerm['word']) && $aSearchTerm['word'] && strpos($sNormQuery, $this->normTerm($aSearchTerm['word'])) !== false) {
760                                         // If we have structured search or this is the first term,
761                                         // make the postcode the primary search element.
762                                         if (!$bHavePostcode && $aSearch['sOperator'] === '' && ($sPhraseType == 'postalcode' || ($iToken == 0 && $iPhrase == 0))) {
763                                             $aNewSearch = $aSearch;
764                                             $aNewSearch['sOperator'] = 'postcode';
                                                // Name terms collected so far become address terms and
                                                // the postcode becomes the only name term.
765                                             $aNewSearch['aAddress'] = array_merge($aNewSearch['aAddress'], $aNewSearch['aName']);
766                                             $aNewSearch['aName'] = array($aSearchTerm['word_id'] => $aSearchTerm['word']);
767                                             if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aNewSearch;
768                                             $bHavePostcode = true;
769                                         }
770
771                                         // If we have a structured search or this is not the first term,
772                                         // add the postcode as an addendum.
773                                         if ($aSearch['sOperator'] !== 'postcode' && ($sPhraseType == 'postalcode' || sizeof($aSearch['aName']))) {
774                                             $aSearch['sPostcode'] = $aSearchTerm['word'];
775                                             if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
776                                         }
777                                     }
778                                 } elseif (($sPhraseType == '' || $sPhraseType == 'street') && $aSearchTerm['class'] == 'place' && $aSearchTerm['type'] == 'house') {
                                        // House number term: the raw token is stored as house number,
                                        // unless one is set already or the search is a postcode search.
779                                     if ($aSearch['sHouseNumber'] === '' && $aSearch['sOperator'] !== 'postcode') {
780                                         $aSearch['sHouseNumber'] = $sToken;
781                                         // sanity check: if the housenumber is not mainly made
782                                         // up of numbers, add a penalty
                                            // (i.e. the token contains more than two non-digit characters)
783                                         if (preg_match_all("/[^0-9]/", $sToken, $aMatches) > 2) $aSearch['iSearchRank']++;
784                                         // also must not appear in the middle of the address
785                                         if ($aSearch['aAddress'] || $aSearch['aAddressNonSearch']) $aSearch['iSearchRank'] += 1;
786                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
787                                         /*
788                                         // Fall back to not searching for this item (better than nothing)
789                                         $aSearch = $aCurrentSearch;
790                                         $aSearch['iSearchRank'] += 1;
791                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
792                                          */
793                                     }
794                                 } elseif ($sPhraseType == '' && $aSearchTerm['class'] !== '' && $aSearchTerm['class'] !== null) {
795                                     // require a normalized exact match of the term
796                                     // if we have the normalizer version of the query
797                                     // available
798                                     if ($aSearch['sOperator'] === ''
799                                         && ($sNormQuery === null || !($aSearchTerm['word'] && strpos($sNormQuery, $aSearchTerm['word']) === false))) {
800                                         $aSearch['sClass'] = $aSearchTerm['class'];
801                                         $aSearch['sType'] = $aSearchTerm['type'];
                                            // Terms without an operator cost two extra rank points and
                                            // become a 'name' search when name terms exist, else 'near'.
802                                         if ($aSearchTerm['operator'] == '') {
803                                             $aSearch['sOperator'] = sizeof($aSearch['aName']) ? 'name' :  'near';
804                                             $aSearch['iSearchRank'] += 2;
805                                         } else {
806                                             $aSearch['sOperator'] = 'near'; // near = in for the moment
807                                         }
808
809                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
810                                     }
811                                 } elseif (isset($aSearchTerm['word_id']) && $aSearchTerm['word_id']) {
                                        // Ordinary word: it becomes the name when the search has no
                                        // name yet, otherwise it can only be an address term.
812                                     if (sizeof($aSearch['aName'])) {
813                                         if ((!$bStructuredPhrases || $iPhrase > 0) && $sPhraseType != 'country' && (!isset($aValidTokens[$sToken]) || strpos($sToken, ' ') !== false)) {
814                                             $aSearch['aAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
815                                         } else {
                                                // NOTE(review): this writes to $aCurrentSearch, not $aSearch, so
                                                // the entry shows up in every copy taken from $aCurrentSearch
                                                // later in this iteration - confirm that this is intended.
                                                // The +1000 keeps $aSearch itself from passing the iMaxRank
                                                // test below (assuming iMaxRank stays far below 1000).
816                                             $aCurrentSearch['aFullNameAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
817                                             $aSearch['iSearchRank'] += 1000; // skip;
818                                         }
819                                     } else {
820                                         $aSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
821                                         //$aSearch['iNamePhrase'] = $iPhrase;
822                                     }
823                                     if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
824                                 }
825                             }
826                         }
827                         // Look for partial matches.
828                         // Note that there is no point in adding country terms here
829                         // because country are omitted in the address.
830                         if (isset($aValidTokens[$sToken]) && $sPhraseType != 'country') {
831                             // Allow searching for a word - but at extra cost
832                             foreach ($aValidTokens[$sToken] as $aSearchTerm) {
833                                 if (isset($aSearchTerm['word_id']) && $aSearchTerm['word_id']) {
                                        // Case 1: use the single-word partial as address term of a
                                        // search that already has a name.
834                                     if ((!$bStructuredPhrases || $iPhrase > 0) && sizeof($aCurrentSearch['aName']) && strpos($sToken, ' ') === false) {
835                                         $aSearch = $aCurrentSearch;
836                                         $aSearch['iSearchRank'] += 1;
                                            // Words whose frequency score reaches CONST_Max_Word_Frequency
                                            // are kept in aAddressNonSearch instead of aAddress.
837                                         if ($aWordFrequencyScores[$aSearchTerm['word_id']] < CONST_Max_Word_Frequency) {
838                                             $aSearch['aAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
839                                             if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
840                                         } elseif (isset($aValidTokens[' '.$sToken])) { // revert to the token version?
841                                             $aSearch['aAddressNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
842                                             $aSearch['iSearchRank'] += 1;
843                                             if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
                                                // In addition, try every plain word (no country code, lat or
                                                // class) stored under the leading-space key as address term.
844                                             foreach ($aValidTokens[' '.$sToken] as $aSearchTermToken) {
845                                                 if (empty($aSearchTermToken['country_code'])
846                                                     && empty($aSearchTermToken['lat'])
847                                                     && empty($aSearchTermToken['class'])
848                                                 ) {
849                                                     $aSearch = $aCurrentSearch;
850                                                     $aSearch['iSearchRank'] += 1;
851                                                     $aSearch['aAddress'][$aSearchTermToken['word_id']] = $aSearchTermToken['word_id'];
852                                                     if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
853                                                 }
854                                             }
855                                         } else {
856                                             $aSearch['aAddressNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
                                                // Purely numeric tokens get two extra penalty points.
857                                             if (preg_match('#^[0-9]+$#', $sToken)) $aSearch['iSearchRank'] += 2;
858                                             if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
859                                         }
860                                     }
861
                                        // Case 2: use the partial as (part of) the name. Only allowed
                                        // while no postcode or address terms are set and the name is
                                        // either still empty or was started in this very phrase.
862                                     if ((!$aCurrentSearch['sPostcode'] && !$aCurrentSearch['aAddress'] && !$aCurrentSearch['aAddressNonSearch'])
863                                         && (!sizeof($aCurrentSearch['aName']) || $aCurrentSearch['iNamePhrase'] == $iPhrase)) {
864                                         $aSearch = $aCurrentSearch;
865                                         $aSearch['iSearchRank'] += 1;
866                                         if (!sizeof($aCurrentSearch['aName'])) $aSearch['iSearchRank'] += 1;
867                                         if (preg_match('#^[0-9]+$#', $sToken)) $aSearch['iSearchRank'] += 2;
868                                         if ($aWordFrequencyScores[$aSearchTerm['word_id']] < CONST_Max_Word_Frequency) {
869                                             $aSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
870                                         } else {
871                                             $aSearch['aNameNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
872                                         }
873                                         $aSearch['iNamePhrase'] = $iPhrase;
874                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
875                                     }
876                                 }
877                             }
878                         } else {
879                             // Allow skipping a word - but at extreme cost (currently disabled)
880                             //$aSearch = $aCurrentSearch;
881                             //$aSearch['iSearchRank']+=100;
882                             //$aNewWordsetSearches[] = $aSearch;
883                         }
884                     }
885                     // Sort and cut
                        // ('bySearchRank' is defined elsewhere - presumably it orders by
                        // ascending iSearchRank, so the 50 best candidates go on to the
                        // next token.)
886                     usort($aNewWordsetSearches, 'bySearchRank');
887                     $aWordsetSearches = array_slice($aNewWordsetSearches, 0, 50);
888                 }
889                 //var_Dump('<hr>',sizeof($aWordsetSearches)); exit;
890
                    // NOTE(review): this merges $aNewWordsetSearches, i.e. the uncut
                    // candidate list of the last token, not the cut $aWordsetSearches.
                    // The list is capped to 50 again below - confirm this is intended.
891                 $aNewPhraseSearches = array_merge($aNewPhraseSearches, $aNewWordsetSearches);
892                 usort($aNewPhraseSearches, 'bySearchRank');
893
                    // Drop searches that are exact duplicates (same serialised form).
894                 $aSearchHash = array();
895                 foreach ($aNewPhraseSearches as $iSearch => $aSearch) {
896                     $sHash = serialize($aSearch);
897                     if (isset($aSearchHash[$sHash])) unset($aNewPhraseSearches[$iSearch]);
898                     else $aSearchHash[$sHash] = 1;
899                 }
900
901                 $aNewPhraseSearches = array_slice($aNewPhraseSearches, 0, 50);
902             }
903
904             // Re-group the searches by their score, junk anything not below iMaxRank as just not worth trying
905             $aGroupedSearches = array();
906             foreach ($aNewPhraseSearches as $aSearch) {
907                 if ($aSearch['iSearchRank'] < $this->iMaxRank) {
908                     if (!isset($aGroupedSearches[$aSearch['iSearchRank']])) $aGroupedSearches[$aSearch['iSearchRank']] = array();
909                     $aGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
910                 }
911             }
912             ksort($aGroupedSearches);
913
                // Carry complete rank groups, lowest rank first, over to the next
                // phrase; stop once more than 50 searches have been collected.
914             $iSearchCount = 0;
915             $aSearches = array();
916             foreach ($aGroupedSearches as $iScore => $aNewSearches) {
917                 $iSearchCount += sizeof($aNewSearches);
918                 $aSearches = array_merge($aSearches, $aNewSearches);
919                 if ($iSearchCount > 50) break;
920             }
921
922             //if (CONST_Debug) _debugDumpGroupedSearches($aGroupedSearches, $aValidTokens);
923         }
924
925         // Revisit searches, giving penalty to unlikely combinations
926         $aGroupedSearches = array();
927         foreach ($aSearches as $aSearch) {
                // Searches that have a house number but no name term are dropped.
928             if (!$aSearch['aName']) {
929                 if ($aSearch['sHouseNumber']) {
930                     continue;
931                 }
932             }
                // Apply the global penalty and group by the final rank.
933             $aSearch['iSearchRank'] += $iGlobalRank;
934             $aGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
935         }
936         ksort($aGroupedSearches);
937
938         return $aGroupedSearches;
939     }
940
941     /* Perform the actual query lookup.
942
943         Returns an ordered list of results, each with the following fields:
944             osm_type: type of corresponding OSM object
945                         N - node
946                         W - way
947                         R - relation
948                         P - postcode (internally computed)
949             osm_id: id of corresponding OSM object
950             class: general object class (corresponds to tag key of primary OSM tag)
951             type: subclass of object (corresponds to tag value of primary OSM tag)
952             admin_level: see http://wiki.openstreetmap.org/wiki/Admin_level
953             rank_search: rank in search hierarchy
954                         (see also http://wiki.openstreetmap.org/wiki/Nominatim/Development_overview#Country_to_street_level)
955             rank_address: rank in address hierarchy (determines order in address)
956             place_id: internal key (may differ between different instances)
957             country_code: ISO country code
958             langaddress: localized full address
959             placename: localized name of object
960             ref: content of ref tag (if available)
961             lon: longitude
962             lat: latitude
963             importance: importance of place based on Wikipedia link count
964             addressimportance: cumulated importance of address elements
965             extra_place: type of place (for admin boundaries, if there is a place tag)
966             aBoundingBox: bounding Box
967             label: short description of the object class/type (English only)
968             name: full name (currently the same as langaddress)
969             foundorder: secondary ordering for places with same importance
970     */
971
972
973     public function lookup()
974     {
975         if (!$this->sQuery && !$this->aStructuredQuery) return array();
976
977         $sNormQuery = $this->normTerm($this->sQuery);
978         $sLanguagePrefArraySQL = "ARRAY[".join(',', array_map("getDBQuoted", $this->aLangPrefOrder))."]";
979         $sCountryCodesSQL = false;
980         if ($this->aCountryCodes) {
981             $sCountryCodesSQL = join(',', array_map('addQuotes', $this->aCountryCodes));
982         }
983
984         $sQuery = $this->sQuery;
985         if (!preg_match('//u', $sQuery)) {
986             userError("Query string is not UTF-8 encoded.");
987         }
988
989         // Conflicts between US state abreviations and various words for 'the' in different languages
990         if (isset($this->aLangPrefOrder['name:en'])) {
991             $sQuery = preg_replace('/(^|,)\s*il\s*(,|$)/', '\1illinois\2', $sQuery);
992             $sQuery = preg_replace('/(^|,)\s*al\s*(,|$)/', '\1alabama\2', $sQuery);
993             $sQuery = preg_replace('/(^|,)\s*la\s*(,|$)/', '\1louisiana\2', $sQuery);
994         }
995
996         $bBoundingBoxSearch = $this->bBoundedSearch && $this->sViewboxSmallSQL;
997         if ($this->sViewboxCentreSQL) {
998             // For complex viewboxes (routes) precompute the bounding geometry
999             $sGeom = chksql(
1000                 $this->oDB->getOne("select ".$this->sViewboxSmallSQL),
1001                 "Could not get small viewbox"
1002             );
1003             $this->sViewboxSmallSQL = "'".$sGeom."'::geometry";
1004
1005             $sGeom = chksql(
1006                 $this->oDB->getOne("select ".$this->sViewboxLargeSQL),
1007                 "Could not get large viewbox"
1008             );
1009             $this->sViewboxLargeSQL = "'".$sGeom."'::geometry";
1010         }
1011
1012         // Do we have anything that looks like a lat/lon pair?
1013         $oNearPoint = false;
1014         if ($aLooksLike = NearPoint::extractFromQuery($sQuery)) {
1015             $oNearPoint = $aLooksLike['pt'];
1016             $sQuery = $aLooksLike['query'];
1017         }
1018
1019         $aSearchResults = array();
1020         if ($sQuery || $this->aStructuredQuery) {
1021             // Start with a blank search
1022             $aSearches = array(
1023                           array(
1024                            'iSearchRank' => 0,
1025                            'iNamePhrase' => -1,
1026                            'sCountryCode' => false,
1027                            'aName' => array(),
1028                            'aAddress' => array(),
1029                            'aFullNameAddress' => array(),
1030                            'aNameNonSearch' => array(),
1031                            'aAddressNonSearch' => array(),
1032                            'sOperator' => '',
1033                            'aFeatureName' => array(),
1034                            'sClass' => '',
1035                            'sType' => '',
1036                            'sHouseNumber' => '',
1037                            'sPostcode' => '',
1038                            'oNear' => $oNearPoint
1039                           )
1040                          );
1041
1042             // Any 'special' terms in the search?
1043             $bSpecialTerms = false;
1044             preg_match_all('/\\[([\\w_]*)=([\\w_]*)\\]/', $sQuery, $aSpecialTermsRaw, PREG_SET_ORDER);
1045             foreach ($aSpecialTermsRaw as $aSpecialTerm) {
1046                 $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery);
1047                 if (!$bSpecialTerms) {
1048                     $aNewSearches = array();
1049                     foreach ($aSearches as $aSearch) {
1050                         $aNewSearch = $aSearch;
1051                         $aNewSearch['sClass'] = $aSpecialTerm[1];
1052                         $aNewSearch['sType'] = $aSpecialTerm[2];
1053                         $aNewSearches[] = $aNewSearch;
1054                     }
1055
1056                     $aSearches = $aNewSearches;
1057                     $bSpecialTerms = true;
1058                 }
1059             }
1060
1061             preg_match_all('/\\[([\\w ]*)\\]/u', $sQuery, $aSpecialTermsRaw, PREG_SET_ORDER);
1062             if (isset($this->aStructuredQuery['amenity']) && $this->aStructuredQuery['amenity']) {
1063                 $aSpecialTermsRaw[] = array('['.$this->aStructuredQuery['amenity'].']', $this->aStructuredQuery['amenity']);
1064                 unset($this->aStructuredQuery['amenity']);
1065             }
1066
1067             foreach ($aSpecialTermsRaw as $aSpecialTerm) {
1068                 $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery);
1069                 if ($bSpecialTerms) {
1070                     continue;
1071                 }
1072
1073                 $sToken = chksql($this->oDB->getOne("SELECT make_standard_name('".pg_escape_string($aSpecialTerm[1])."') AS string"));
1074                 $sSQL = 'SELECT * ';
1075                 $sSQL .= 'FROM ( ';
1076                 $sSQL .= '   SELECT word_id, word_token, word, class, type, country_code, operator';
1077                 $sSQL .= '   FROM word ';
1078                 $sSQL .= '   WHERE word_token in (\' '.$sToken.'\')';
1079                 $sSQL .= ') AS x ';
1080                 $sSQL .= ' WHERE (class is not null AND class not in (\'place\'))';
1081                 if (CONST_Debug) var_Dump($sSQL);
1082                 $aSearchWords = chksql($this->oDB->getAll($sSQL));
1083                 $aNewSearches = array();
1084                 foreach ($aSearches as $aSearch) {
1085                     foreach ($aSearchWords as $aSearchTerm) {
1086                         $aNewSearch = $aSearch;
1087                         $aNewSearch['sClass'] = $aSearchTerm['class'];
1088                         $aNewSearch['sType'] = $aSearchTerm['type'];
1089                         $aNewSearches[] = $aNewSearch;
1090                         $bSpecialTerms = true;
1091                     }
1092                 }
1093                 $aSearches = $aNewSearches;
1094             }
1095
1096             // Split query into phrases
1097             // Commas are used to reduce the search space by indicating where phrases split
1098             if ($this->aStructuredQuery) {
1099                 $aPhrases = $this->aStructuredQuery;
1100                 $bStructuredPhrases = true;
1101             } else {
1102                 $aPhrases = explode(',', $sQuery);
1103                 $bStructuredPhrases = false;
1104             }
1105
1106             // Convert each phrase to standard form
1107             // Create a list of standard words
1108             // Get all 'sets' of words
1109             // Generate a complete list of all
1110             $aTokens = array();
1111             foreach ($aPhrases as $iPhrase => $sPhrase) {
1112                 $aPhrase = chksql(
1113                     $this->oDB->getRow("SELECT make_standard_name('".pg_escape_string($sPhrase)."') as string"),
1114                     "Cannot normalize query string (is it a UTF-8 string?)"
1115                 );
1116                 if (trim($aPhrase['string'])) {
1117                     $aPhrases[$iPhrase] = $aPhrase;
1118                     $aPhrases[$iPhrase]['words'] = explode(' ', $aPhrases[$iPhrase]['string']);
1119                     $aPhrases[$iPhrase]['wordsets'] = getWordSets($aPhrases[$iPhrase]['words'], 0);
1120                     $aTokens = array_merge($aTokens, getTokensFromSets($aPhrases[$iPhrase]['wordsets']));
1121                 } else {
1122                     unset($aPhrases[$iPhrase]);
1123                 }
1124             }
1125
1126             // Reindex phrases - we make assumptions later on that they are numerically keyed in order
1127             $aPhraseTypes = array_keys($aPhrases);
1128             $aPhrases = array_values($aPhrases);
1129
1130             if (sizeof($aTokens)) {
1131                 // Check which tokens we have, get the ID numbers
1132                 $sSQL = 'SELECT word_id, word_token, word, class, type, country_code, operator, search_name_count';
1133                 $sSQL .= ' FROM word ';
1134                 $sSQL .= ' WHERE word_token in ('.join(',', array_map("getDBQuoted", $aTokens)).')';
1135
1136                 if (CONST_Debug) var_Dump($sSQL);
1137
1138                 $aValidTokens = array();
1139                 $aDatabaseWords = chksql(
1140                     $this->oDB->getAll($sSQL),
1141                     "Could not get word tokens."
1142                 );
1143                 $aPossibleMainWordIDs = array();
1144                 $aWordFrequencyScores = array();
1145                 foreach ($aDatabaseWords as $aToken) {
1146                     // Very special case - require 2 letter country param to match the country code found
1147                     if ($bStructuredPhrases && $aToken['country_code'] && !empty($this->aStructuredQuery['country'])
1148                         && strlen($this->aStructuredQuery['country']) == 2 && strtolower($this->aStructuredQuery['country']) != $aToken['country_code']
1149                     ) {
1150                         continue;
1151                     }
1152
1153                     if (isset($aValidTokens[$aToken['word_token']])) {
1154                         $aValidTokens[$aToken['word_token']][] = $aToken;
1155                     } else {
1156                         $aValidTokens[$aToken['word_token']] = array($aToken);
1157                     }
1158                     if (!$aToken['class'] && !$aToken['country_code']) $aPossibleMainWordIDs[$aToken['word_id']] = 1;
1159                     $aWordFrequencyScores[$aToken['word_id']] = $aToken['search_name_count'] + 1;
1160                 }
1161                 if (CONST_Debug) var_Dump($aPhrases, $aValidTokens);
1162
1163                 // US ZIP+4 codes - if there is no token, merge in the 5-digit ZIP code
1164                 foreach ($aTokens as $sToken) {
1165                     if (!isset($aValidTokens[$sToken]) && preg_match('/^([0-9]{5}) [0-9]{4}$/', $sToken, $aData)) {
1166                         if (isset($aValidTokens[$aData[1]])) {
1167                             foreach ($aValidTokens[$aData[1]] as $aToken) {
1168                                 if (!$aToken['class']) {
1169                                     if (isset($aValidTokens[$sToken])) {
1170                                         $aValidTokens[$sToken][] = $aToken;
1171                                     } else {
1172                                         $aValidTokens[$sToken] = array($aToken);
1173                                     }
1174                                 }
1175                             }
1176                         }
1177                     }
1178                 }
1179
1180                 foreach ($aTokens as $sToken) {
1181                     // Unknown single word token with a number - assume it is a house number
1182                     if (!isset($aValidTokens[' '.$sToken]) && strpos($sToken, ' ') === false && preg_match('/[0-9]/', $sToken)) {
1183                         $aValidTokens[' '.$sToken] = array(array('class' => 'place', 'type' => 'house'));
1184                     }
1185                 }
1186
1187                 // Any words that have failed completely?
1188                 // TODO: suggestions
1189
1190                 // Start the search process
1191                 // array with: placeid => -1 | tiger-housenumber
1192                 $aResultPlaceIDs = array();
1193
1194                 $aGroupedSearches = $this->getGroupedSearches($aSearches, $aPhraseTypes, $aPhrases, $aValidTokens, $aWordFrequencyScores, $bStructuredPhrases, $sNormQuery);
1195
1196                 if ($this->bReverseInPlan) {
1197                     // Reverse phrase array and also reverse the order of the wordsets in
1198                     // the first and final phrase. Don't bother about phrases in the middle
1199                     // because order in the address doesn't matter.
1200                     $aPhrases = array_reverse($aPhrases);
1201                     $aPhrases[0]['wordsets'] = getInverseWordSets($aPhrases[0]['words'], 0);
1202                     if (sizeof($aPhrases) > 1) {
1203                         $aFinalPhrase = end($aPhrases);
1204                         $aPhrases[sizeof($aPhrases)-1]['wordsets'] = getInverseWordSets($aFinalPhrase['words'], 0);
1205                     }
1206                     $aReverseGroupedSearches = $this->getGroupedSearches($aSearches, null, $aPhrases, $aValidTokens, $aWordFrequencyScores, false, $sNormQuery);
1207
1208                     foreach ($aGroupedSearches as $aSearches) {
1209                         foreach ($aSearches as $aSearch) {
1210                             if ($aSearch['iSearchRank'] < $this->iMaxRank) {
1211                                 if (!isset($aReverseGroupedSearches[$aSearch['iSearchRank']])) $aReverseGroupedSearches[$aSearch['iSearchRank']] = array();
1212                                 $aReverseGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
1213                             }
1214                         }
1215                     }
1216
1217                     $aGroupedSearches = $aReverseGroupedSearches;
1218                     ksort($aGroupedSearches);
1219                 }
1220             } else {
1221                 // Re-group the searches by their score, junk anything at or above iMaxRank (20 by default) as just not worth trying
1222                 $aGroupedSearches = array();
1223                 foreach ($aSearches as $aSearch) {
1224                     if ($aSearch['iSearchRank'] < $this->iMaxRank) {
1225                         if (!isset($aGroupedSearches[$aSearch['iSearchRank']])) $aGroupedSearches[$aSearch['iSearchRank']] = array();
1226                         $aGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
1227                     }
1228                 }
1229                 ksort($aGroupedSearches);
1230             }
1231
1232             // Filter out duplicate searches
1233             $aSearchHash = array();
1234             foreach ($aGroupedSearches as $iGroup => $aSearches) {
1235                 foreach ($aSearches as $iSearch => $aSearch) {
1236                     $sHash = serialize($aSearch);
1237                     if (isset($aSearchHash[$sHash])) {
1238                         unset($aGroupedSearches[$iGroup][$iSearch]);
1239                         if (sizeof($aGroupedSearches[$iGroup]) == 0) unset($aGroupedSearches[$iGroup]);
1240                     } else {
1241                         $aSearchHash[$sHash] = 1;
1242                     }
1243                 }
1244             }
1245
1246             if (CONST_Debug) _debugDumpGroupedSearches($aGroupedSearches, $aValidTokens);
1247
1248             $iGroupLoop = 0;
1249             $iQueryLoop = 0;
1250             foreach ($aGroupedSearches as $iGroupedRank => $aSearches) {
1251                 $iGroupLoop++;
1252                 foreach ($aSearches as $aSearch) {
1253                     $iQueryLoop++;
1254                     $searchedHousenumber = -1;
1255
1256                     if (CONST_Debug) echo "<hr><b>Search Loop, group $iGroupLoop, loop $iQueryLoop</b>";
1257                     if (CONST_Debug) _debugDumpGroupedSearches(array($iGroupedRank => array($aSearch)), $aValidTokens);
1258
1259                     if ($sCountryCodesSQL && $aSearch['sCountryCode'] && !in_array($aSearch['sCountryCode'], $this->aCountryCodes)) {
1260                         continue;
1261                     }
1262
1263                     // No location term?
1264                     if (!sizeof($aSearch['aName']) && !sizeof($aSearch['aAddress'])) {
1265                         if ($aSearch['sCountryCode'] && !$aSearch['sClass'] && !$aSearch['sHouseNumber'] && !$aSearch['oNear']) {
1266                             // Just looking for a country by code - look it up
1267                             if (4 >= $this->iMinAddressRank && 4 <= $this->iMaxAddressRank) {
1268                                 $sSQL = "SELECT place_id FROM placex WHERE country_code='".$aSearch['sCountryCode']."' AND rank_search = 4";
1269                                 if ($bBoundingBoxSearch)
1270                                     $sSQL .= " AND _st_intersects($this->sViewboxSmallSQL, geometry)";
1271                                 $sSQL .= " ORDER BY st_area(geometry) DESC LIMIT 1";
1272                                 if (CONST_Debug) var_dump($sSQL);
1273                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1274                             } else {
1275                                 $aPlaceIDs = array();
1276                             }
1277                         } else {
1278                             if (!$bBoundingBoxSearch && !$aSearch['oNear']) continue;
1279                             if (!$aSearch['sClass']) continue;
1280
1281                             $sSQL = "SELECT COUNT(*) FROM pg_tables WHERE tablename = 'place_classtype_".$aSearch['sClass']."_".$aSearch['sType']."'";
1282                             if (chksql($this->oDB->getOne($sSQL))) {
1283                                 $sSQL = "SELECT place_id FROM place_classtype_".$aSearch['sClass']."_".$aSearch['sType']." ct";
1284                                 if ($sCountryCodesSQL) $sSQL .= " JOIN placex USING (place_id)";
1285                                 if ($aSearch['oNear']) {
1286                                     $sSQL .= " WHERE ".$aSearch['oNear']->withinSQL('ct.centroid');
1287                                 } else {
1288                                     $sSQL .= " WHERE st_contains($this->sViewboxSmallSQL, ct.centroid)";
1289                                 }
1290                                 if ($sCountryCodesSQL) $sSQL .= " AND country_code in ($sCountryCodesSQL)";
1291                                 if (sizeof($this->aExcludePlaceIDs)) {
1292                                     $sSQL .= " AND place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1293                                 }
1294                                 if ($this->sViewboxCentreSQL) {
1295                                     $sSQL .= " ORDER BY ST_Distance($this->sViewboxCentreSQL, ct.centroid) ASC";
1296                                 } elseif ($aSearch['oNear']) {
1297                                     $sSQL .= " ORDER BY ".$aSearch['oNear']->distanceSQL('ct.centroid').' ASC';
1298                                 }
1299                                 $sSQL .= " limit $this->iLimit";
1300                                 if (CONST_Debug) var_dump($sSQL);
1301                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1302                             } else if ($aSearch['oNear']) {
1303                                 $sSQL = "SELECT place_id ";
1304                                 $sSQL .= "FROM placex ";
1305                                 $sSQL .= "WHERE class='".$aSearch['sClass']."' ";
1306                                 $sSQL .= "  AND type='".$aSearch['sType']."'";
1307                                 $sSQL .= "  AND ".$aSearch['oNear']->withinSQL('geometry');
1308                                 $sSQL .= "  AND linked_place_id is null";
1309                                 if ($sCountryCodesSQL) $sSQL .= " AND country_code in ($sCountryCodesSQL)";
1310                                 $sSQL .= " ORDER BY ".$aSearch['oNear']->distanceSQL('centroid')." ASC";
1311                                 $sSQL .= " LIMIT $this->iLimit";
1312                                 if (CONST_Debug) var_dump($sSQL);
1313                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1314                             }
1315                         }
1316                     } elseif ($aSearch['oNear'] && !sizeof($aSearch['aName']) && !sizeof($aSearch['aAddress']) && !$aSearch['sClass']) {
1317                         // If a coordinate is given, the search must either
1318                         // be for a name or a special search. Ignore everything else.
1319                         $aPlaceIDs = array();
1320                     } elseif ($aSearch['sOperator'] == 'postcode') {
1321                         $sSQL  = "SELECT p.place_id FROM location_postcode p ";
1322                         if (sizeof($aSearch['aAddress'])) {
1323                             $sSQL .= ", search_name s ";
1324                             $sSQL .= "WHERE s.place_id = p.parent_place_id ";
1325                             $sSQL .= "AND array_cat(s.nameaddress_vector, s.name_vector) @> ARRAY[".join($aSearch['aAddress'], ",")."] AND ";
1326                         } else {
1327                             $sSQL .= " WHERE ";
1328                         }
1329                         $sSQL .= "p.postcode = '".pg_escape_string(reset($aSearch['aName']))."'";
1330                         if ($aSearch['sCountryCode']) {
1331                             $sSQL .= " AND p.country_code = '".$aSearch['sCountryCode']."'";
1332                         } elseif ($sCountryCodesSQL) {
1333                             $sSQL .= " AND p.country_code in ($sCountryCodesSQL)";
1334                         }
1335                         $sSQL .= " LIMIT $this->iLimit";
1336                         if (CONST_Debug) var_dump($sSQL);
1337                         $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1338                     } else {
1339                         $aPlaceIDs = array();
1340
1341                         // First we need a position, either aName or fLat or both
1342                         $aTerms = array();
1343                         $aOrder = array();
1344
1345                         if ($aSearch['sHouseNumber'] && sizeof($aSearch['aAddress'])) {
1346                             $sHouseNumberRegex = '\\\\m'.$aSearch['sHouseNumber'].'\\\\M';
1347                             $aOrder[] = "";
1348                             $aOrder[0] = "  (";
1349                             $aOrder[0] .= "   EXISTS(";
1350                             $aOrder[0] .= "     SELECT place_id ";
1351                             $aOrder[0] .= "     FROM placex ";
1352                             $aOrder[0] .= "     WHERE parent_place_id = search_name.place_id";
1353                             $aOrder[0] .= "       AND transliteration(housenumber) ~* E'".$sHouseNumberRegex."' ";
1354                             $aOrder[0] .= "     LIMIT 1";
1355                             $aOrder[0] .= "   ) ";
1356                             // also housenumbers from interpolation lines table are needed
1357                             $aOrder[0] .= "   OR EXISTS(";
1358                             $aOrder[0] .= "     SELECT place_id ";
1359                             $aOrder[0] .= "     FROM location_property_osmline ";
1360                             $aOrder[0] .= "     WHERE parent_place_id = search_name.place_id";
1361                             $aOrder[0] .= "       AND startnumber is not NULL";
1362                             $aOrder[0] .= "       AND ".intval($aSearch['sHouseNumber']).">=startnumber ";
1363                             $aOrder[0] .= "       AND ".intval($aSearch['sHouseNumber'])."<=endnumber ";
1364                             $aOrder[0] .= "     LIMIT 1";
1365                             $aOrder[0] .= "   )";
1366                             $aOrder[0] .= " )";
1367                             $aOrder[0] .= " DESC";
1368                         }
1369
1370                         // TODO: filter out the pointless search terms (2 letter name tokens and less)
1371                         // they might be right - but they are just too darned expensive to run
1372                         if (sizeof($aSearch['aName'])) $aTerms[] = "name_vector @> ARRAY[".join($aSearch['aName'], ",")."]";
1373                         if (sizeof($aSearch['aNameNonSearch'])) $aTerms[] = "array_cat(name_vector,ARRAY[]::integer[]) @> ARRAY[".join($aSearch['aNameNonSearch'], ",")."]";
1374                         if (sizeof($aSearch['aAddress']) && $aSearch['aName'] != $aSearch['aAddress']) {
1375                             // For infrequent name terms disable index usage for address
1376                             if (CONST_Search_NameOnlySearchFrequencyThreshold
1377                                 && sizeof($aSearch['aName']) == 1
1378                                 && $aWordFrequencyScores[$aSearch['aName'][reset($aSearch['aName'])]] < CONST_Search_NameOnlySearchFrequencyThreshold
1379                             ) {
1380                                 $aTerms[] = "array_cat(nameaddress_vector,ARRAY[]::integer[]) @> ARRAY[".join(array_merge($aSearch['aAddress'], $aSearch['aAddressNonSearch']), ",")."]";
1381                             } else {
1382                                 $aTerms[] = "nameaddress_vector @> ARRAY[".join($aSearch['aAddress'], ",")."]";
1383                                 if (sizeof($aSearch['aAddressNonSearch'])) {
1384                                     $aTerms[] = "array_cat(nameaddress_vector,ARRAY[]::integer[]) @> ARRAY[".join($aSearch['aAddressNonSearch'], ",")."]";
1385                                 }
1386                             }
1387                         }
1388                         if ($aSearch['sCountryCode']) $aTerms[] = "country_code = '".pg_escape_string($aSearch['sCountryCode'])."'";
1389                         if ($aSearch['sHouseNumber']) {
1390                             $aTerms[] = "address_rank between 16 and 27";
1391                         } elseif (!$aSearch['sClass'] || $aSearch['sOperator'] == 'name') {
1392                             if ($this->iMinAddressRank > 0) {
1393                                 $aTerms[] = "address_rank >= ".$this->iMinAddressRank;
1394                             }
1395                             if ($this->iMaxAddressRank < 30) {
1396                                 $aTerms[] = "address_rank <= ".$this->iMaxAddressRank;
1397                             }
1398                         }
1399                         if ($aSearch['oNear']) {
1400                             $aTerms[] = $aSearch['oNear']->withinSQL('centroid');
1401
1402                             $aOrder[] = $aSearch['oNear']->distanceSQL('centroid');
1403                         } elseif ($aSearch['sPostcode']) {
1404                             if (!sizeof($aSearch['aAddress'])) {
1405                                 $aTerms[] = "EXISTS(SELECT place_id FROM location_postcode p WHERE p.postcode = '".$aSearch['sPostcode']."' AND ST_DWithin(search_name.centroid, p.geometry, 0.1))";
1406                             } else {
1407                                 $aOrder[] = "(SELECT min(ST_Distance(search_name.centroid, p.geometry)) FROM location_postcode p WHERE p.postcode = '".$aSearch['sPostcode']."')";
1408                             }
1409                         }
1410                         if (sizeof($this->aExcludePlaceIDs)) {
1411                             $aTerms[] = "place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1412                         }
1413                         if ($sCountryCodesSQL) {
1414                             $aTerms[] = "country_code in ($sCountryCodesSQL)";
1415                         }
1416
1417                         if ($bBoundingBoxSearch) $aTerms[] = "centroid && $this->sViewboxSmallSQL";
1418                         if ($oNearPoint) {
1419                             $aOrder[] = $oNearPoint->distanceSQL('centroid');
1420                         }
1421
1422                         if ($aSearch['sHouseNumber']) {
1423                             $sImportanceSQL = '- abs(26 - address_rank) + 3';
1424                         } else {
1425                             $sImportanceSQL = '(CASE WHEN importance = 0 OR importance IS NULL THEN 0.75-(search_rank::float/40) ELSE importance END)';
1426                         }
1427                         if ($this->sViewboxSmallSQL) $sImportanceSQL .= " * CASE WHEN ST_Contains($this->sViewboxSmallSQL, centroid) THEN 1 ELSE 0.5 END";
1428                         if ($this->sViewboxLargeSQL) $sImportanceSQL .= " * CASE WHEN ST_Contains($this->sViewboxLargeSQL, centroid) THEN 1 ELSE 0.5 END";
1429
1430                         $aOrder[] = "$sImportanceSQL DESC";
1431                         if (sizeof($aSearch['aFullNameAddress'])) {
1432                             $sExactMatchSQL = ' ( ';
1433                             $sExactMatchSQL .= '   SELECT count(*) FROM ( ';
1434                             $sExactMatchSQL .= '      SELECT unnest(ARRAY['.join($aSearch['aFullNameAddress'], ",").']) ';
1435                             $sExactMatchSQL .= '      INTERSECT ';
1436                             $sExactMatchSQL .= '      SELECT unnest(nameaddress_vector)';
1437                             $sExactMatchSQL .= '   ) s';
1438                             $sExactMatchSQL .= ') as exactmatch';
1439                             $aOrder[] = 'exactmatch DESC';
1440                         } else {
1441                             $sExactMatchSQL = '0::int as exactmatch';
1442                         }
1443
1444                         if (sizeof($aTerms)) {
1445                             $sSQL = "SELECT place_id, ";
1446                             $sSQL .= $sExactMatchSQL;
1447                             $sSQL .= " FROM search_name";
1448                             $sSQL .= " WHERE ".join(' and ', $aTerms);
1449                             $sSQL .= " ORDER BY ".join(', ', $aOrder);
1450                             if ($aSearch['sHouseNumber'] || $aSearch['sClass']) {
1451                                 $sSQL .= " LIMIT 20";
1452                             } elseif (!sizeof($aSearch['aName']) && !sizeof($aSearch['aAddress']) && $aSearch['sClass']) {
1453                                 $sSQL .= " LIMIT 1";
1454                             } else {
1455                                 $sSQL .= " LIMIT ".$this->iLimit;
1456                             }
1457
1458                             if (CONST_Debug) var_dump($sSQL);
1459                             $aViewBoxPlaceIDs = chksql(
1460                                 $this->oDB->getAll($sSQL),
1461                                 "Could not get places for search terms."
1462                             );
1463                             //var_dump($aViewBoxPlaceIDs);
1464                             // Did we have any viewbox matches?
1465                             $aPlaceIDs = array();
1466                             $bViewBoxMatch = false;
1467                             foreach ($aViewBoxPlaceIDs as $aViewBoxRow) {
1468                                 //if ($bViewBoxMatch == 1 && $aViewBoxRow['in_small'] == 'f') break;
1469                                 //if ($bViewBoxMatch == 2 && $aViewBoxRow['in_large'] == 'f') break;
1470                                 //if ($aViewBoxRow['in_small'] == 't') $bViewBoxMatch = 1;
1471                                 //else if ($aViewBoxRow['in_large'] == 't') $bViewBoxMatch = 2;
1472                                 $aPlaceIDs[] = $aViewBoxRow['place_id'];
1473                                 $this->exactMatchCache[$aViewBoxRow['place_id']] = $aViewBoxRow['exactmatch'];
1474                             }
1475                         }
1476                         //var_Dump($aPlaceIDs);
1477                         //exit;
1478
1479                         //now search for housenumber, if housenumber provided
1480                         if ($aSearch['sHouseNumber'] && sizeof($aPlaceIDs)) {
1481                             $searchedHousenumber = intval($aSearch['sHouseNumber']);
1482                             $aRoadPlaceIDs = $aPlaceIDs;
1483                             $sPlaceIDs = join(',', $aPlaceIDs);
1484
1485                             // Now they are indexed, look for a house attached to a street we found
1486                             $sHouseNumberRegex = '\\\\m'.$aSearch['sHouseNumber'].'\\\\M';
1487                             $sSQL = "SELECT place_id FROM placex ";
1488                             $sSQL .= "WHERE parent_place_id in (".$sPlaceIDs.") and transliteration(housenumber) ~* E'".$sHouseNumberRegex."'";
1489                             if (sizeof($this->aExcludePlaceIDs)) {
1490                                 $sSQL .= " AND place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1491                             }
1492                             $sSQL .= " LIMIT $this->iLimit";
1493                             if (CONST_Debug) var_dump($sSQL);
1494                             $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1495
1496                             // if nothing found, search in the interpolation line table
1497                             if (!sizeof($aPlaceIDs)) {
1498                                 // do we need to use transliteration and the regex for housenumbers???
1499                                 //new query for lines, not housenumbers anymore
1500                                 $sSQL = "SELECT distinct place_id FROM location_property_osmline";
1501                                 $sSQL .= " WHERE startnumber is not NULL and parent_place_id in (".$sPlaceIDs.") and (";
1502                                 if ($searchedHousenumber%2 == 0) {
1503                                     //if housenumber is even, look for housenumber in streets with interpolationtype even or all
1504                                     $sSQL .= "interpolationtype='even'";
1505                                 } else {
1506                                     //look for housenumber in streets with interpolationtype odd or all
1507                                     $sSQL .= "interpolationtype='odd'";
1508                                 }
1509                                 $sSQL .= " or interpolationtype='all') and ";
1510                                 $sSQL .= $searchedHousenumber.">=startnumber and ";
1511                                 $sSQL .= $searchedHousenumber."<=endnumber";
1512
1513                                 if (sizeof($this->aExcludePlaceIDs)) {
1514                                     $sSQL .= " AND place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1515                                 }
1516                                 //$sSQL .= " limit $this->iLimit";
1517                                 if (CONST_Debug) var_dump($sSQL);
1518                                 //get place IDs
1519                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL, 0));
1520                             }
1521
1522                             // If nothing found try the aux fallback table
1523                             if (CONST_Use_Aux_Location_data && !sizeof($aPlaceIDs)) {
1524                                 $sSQL = "SELECT place_id FROM location_property_aux ";
1525                                 $sSQL .= " WHERE parent_place_id in (".$sPlaceIDs.") ";
1526                                 $sSQL .= " AND housenumber = '".pg_escape_string($aSearch['sHouseNumber'])."'";
1527                                 if (sizeof($this->aExcludePlaceIDs)) {
1528                                     $sSQL .= " AND parent_place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1529                                 }
1530                                 //$sSQL .= " limit $this->iLimit";
1531                                 if (CONST_Debug) var_dump($sSQL);
1532                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1533                             }
1534
1535                             //if nothing was found in placex or location_property_aux, then search in Tiger data for this housenumber(location_property_tiger)
1536                             if (CONST_Use_US_Tiger_Data && !sizeof($aPlaceIDs)) {
1537                                 $sSQL = "SELECT distinct place_id FROM location_property_tiger";
1538                                 $sSQL .= " WHERE parent_place_id in (".$sPlaceIDs.") and (";
1539                                 if ($searchedHousenumber%2 == 0) {
1540                                     $sSQL .= "interpolationtype='even'";
1541                                 } else {
1542                                     $sSQL .= "interpolationtype='odd'";
1543                                 }
1544                                 $sSQL .= " or interpolationtype='all') and ";
1545                                 $sSQL .= $searchedHousenumber.">=startnumber and ";
1546                                 $sSQL .= $searchedHousenumber."<=endnumber";
1547
1548                                 if (sizeof($this->aExcludePlaceIDs)) {
1549                                     $sSQL .= " AND place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1550                                 }
1551                                 //$sSQL .= " limit $this->iLimit";
1552                                 if (CONST_Debug) var_dump($sSQL);
1553                                 //get place IDs
1554                                 $aPlaceIDs = chksql($this->oDB->getCol($sSQL, 0));
1555                             }
1556
1557                             // Fallback to the road (if no housenumber was found)
1558                             if (!sizeof($aPlaceIDs) && preg_match('/[0-9]+/', $aSearch['sHouseNumber'])
1559                                 && ($aSearch['aAddress'] || $aSearch['sCountryCode'])) {
1560                                 $aPlaceIDs = $aRoadPlaceIDs;
1561                                 //set to -1, if no housenumbers were found
1562                                 $searchedHousenumber = -1;
1563                             }
1564                             //else: housenumber was found, remains saved in searchedHousenumber
1565                         }
1566
1567
1568                         if ($aSearch['sClass'] && sizeof($aPlaceIDs)) {
1569                             $sPlaceIDs = join(',', $aPlaceIDs);
1570                             $aClassPlaceIDs = array();
1571
1572                             if (!$aSearch['sOperator'] || $aSearch['sOperator'] == 'name') {
1573                                 // If they were searching for a named class (i.e. 'Kings Head pub') then we might have an extra match
1574                                 $sSQL = "SELECT place_id ";
1575                                 $sSQL .= " FROM placex ";
1576                                 $sSQL .= " WHERE place_id in ($sPlaceIDs) ";
1577                                 $sSQL .= "   AND class='".$aSearch['sClass']."' ";
1578                                 $sSQL .= "   AND type='".$aSearch['sType']."'";
1579                                 $sSQL .= "   AND linked_place_id is null";
1580                                 if ($sCountryCodesSQL) $sSQL .= " AND country_code in ($sCountryCodesSQL)";
1581                                 $sSQL .= " ORDER BY rank_search ASC ";
1582                                 $sSQL .= " LIMIT $this->iLimit";
1583                                 if (CONST_Debug) var_dump($sSQL);
1584                                 $aClassPlaceIDs = chksql($this->oDB->getCol($sSQL));
1585                             }
1586
1587                             if (!$aSearch['sOperator'] || $aSearch['sOperator'] == 'near') { // & in
1588                                 $sClassTable = 'place_classtype_'.$aSearch['sClass'].'_'.$aSearch['sType'];
1589                                 $sSQL = "SELECT count(*) FROM pg_tables ";
1590                                 $sSQL .= "WHERE tablename = '$sClassTable'";
1591                                 $bCacheTable = chksql($this->oDB->getOne($sSQL));
1592
1593                                 $sSQL = "SELECT min(rank_search) FROM placex WHERE place_id in ($sPlaceIDs)";
1594
1595                                 if (CONST_Debug) var_dump($sSQL);
1596                                 $this->iMaxRank = ((int)chksql($this->oDB->getOne($sSQL)));
1597
1598                                 // For state / country level searches the normal radius search doesn't work very well
1599                                 $sPlaceGeom = false;
1600                                 if ($this->iMaxRank < 9 && $bCacheTable) {
1601                                     // Try and get a polygon to search in instead
1602                                     $sSQL = "SELECT geometry ";
1603                                     $sSQL .= " FROM placex";
1604                                     $sSQL .= " WHERE place_id in ($sPlaceIDs)";
1605                                     $sSQL .= "   AND rank_search < $this->iMaxRank + 5";
1606                                     $sSQL .= "   AND ST_Geometrytype(geometry) in ('ST_Polygon','ST_MultiPolygon')";
1607                                     $sSQL .= " ORDER BY rank_search ASC ";
1608                                     $sSQL .= " LIMIT 1";
1609                                     if (CONST_Debug) var_dump($sSQL);
1610                                     $sPlaceGeom = chksql($this->oDB->getOne($sSQL));
1611                                 }
1612
1613                                 if ($sPlaceGeom) {
1614                                     $sPlaceIDs = false;
1615                                 } else {
1616                                     $this->iMaxRank += 5;
1617                                     $sSQL = "SELECT place_id FROM placex WHERE place_id in ($sPlaceIDs) and rank_search < $this->iMaxRank";
1618                                     if (CONST_Debug) var_dump($sSQL);
1619                                     $aPlaceIDs = chksql($this->oDB->getCol($sSQL));
1620                                     $sPlaceIDs = join(',', $aPlaceIDs);
1621                                 }
1622
1623                                 if ($sPlaceIDs || $sPlaceGeom) {
1624                                     $fRange = 0.01;
1625                                     if ($bCacheTable) {
1626                                         // More efficient - can make the range bigger
1627                                         $fRange = 0.05;
1628
1629                                         $sOrderBySQL = '';
1630                                         if ($oNearPoint) {
1631                                             $sOrderBySQL = $oNearPoint->distanceSQL('l.centroid');
1632                                         } elseif ($sPlaceIDs) {
1633                                             $sOrderBySQL = "ST_Distance(l.centroid, f.geometry)";
1634                                         } elseif ($sPlaceGeom) {
1635                                             $sOrderBySQL = "ST_Distance(st_centroid('".$sPlaceGeom."'), l.centroid)";
1636                                         }
1637
1638                                         $sSQL = "select distinct i.place_id".($sOrderBySQL?', i.order_term':'')." from (";
1639                                         $sSQL .= "select l.place_id".($sOrderBySQL?','.$sOrderBySQL.' as order_term':'')." from ".$sClassTable." as l";
1640                                         if ($sCountryCodesSQL) $sSQL .= " join placex as lp using (place_id)";
1641                                         if ($sPlaceIDs) {
1642                                             $sSQL .= ",placex as f where ";
1643                                             $sSQL .= "f.place_id in ($sPlaceIDs) and ST_DWithin(l.centroid, f.centroid, $fRange) ";
1644                                         }
1645                                         if ($sPlaceGeom) {
1646                                             $sSQL .= " where ";
1647                                             $sSQL .= "ST_Contains('".$sPlaceGeom."', l.centroid) ";
1648                                         }
1649                                         if (sizeof($this->aExcludePlaceIDs)) {
1650                                             $sSQL .= " and l.place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1651                                         }
1652                                         if ($sCountryCodesSQL) $sSQL .= " and lp.country_code in ($sCountryCodesSQL)";
1653                                         $sSQL .= 'limit 300) i ';
1654                                         if ($sOrderBySQL) $sSQL .= "order by order_term asc";
1655                                         if ($this->iOffset) $sSQL .= " offset $this->iOffset";
1656                                         $sSQL .= " limit $this->iLimit";
1657                                         if (CONST_Debug) var_dump($sSQL);
1658                                         $aClassPlaceIDs = array_merge($aClassPlaceIDs, chksql($this->oDB->getCol($sSQL)));
1659                                     } else {
1660                                         if ($aSearch['oNear']) {
1661                                             $fRange = $aSearch['oNear']->radius();
1662                                         }
1663
1664                                         $sOrderBySQL = '';
1665                                         if ($oNearPoint) {
1666                                             $sOrderBySQL = $oNearPoint->distanceSQL('l.geometry');
1667                                         } else {
1668                                             $sOrderBySQL = "ST_Distance(l.geometry, f.geometry)";
1669                                         }
1670
1671                                         $sSQL = "SELECT distinct l.place_id".($sOrderBySQL?','.$sOrderBySQL:'');
1672                                         $sSQL .= " FROM placex as l, placex as f ";
1673                                         $sSQL .= " WHERE f.place_id in ($sPlaceIDs) ";
1674                                         $sSQL .= "  AND ST_DWithin(l.geometry, f.centroid, $fRange) ";
1675                                         $sSQL .= "  AND l.class='".$aSearch['sClass']."' ";
1676                                         $sSQL .= "  AND l.type='".$aSearch['sType']."' ";
1677                                         if (sizeof($this->aExcludePlaceIDs)) {
1678                                             $sSQL .= " AND l.place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1679                                         }
1680                                         if ($sCountryCodesSQL) $sSQL .= " AND l.country_code in ($sCountryCodesSQL)";
1681                                         if ($sOrderBySQL) $sSQL .= "ORDER BY ".$sOrderBySQL." ASC";
1682                                         if ($this->iOffset) $sSQL .= " OFFSET $this->iOffset";
1683                                         $sSQL .= " limit $this->iLimit";
1684                                         if (CONST_Debug) var_dump($sSQL);
1685                                         $aClassPlaceIDs = array_merge($aClassPlaceIDs, chksql($this->oDB->getCol($sSQL)));
1686                                     }
1687                                 }
1688                             }
1689                             $aPlaceIDs = $aClassPlaceIDs;
1690                         }
1691                     }
1692
1693                     if (CONST_Debug) {
1694                         echo "<br><b>Place IDs:</b> ";
1695                         var_Dump($aPlaceIDs);
1696                     }
1697
1698                     if (sizeof($aPlaceIDs) && $aSearch['sPostcode']) {
1699                         $sSQL = 'SELECT place_id FROM placex';
1700                         $sSQL .= ' WHERE place_id in ('.join(',', $aPlaceIDs).')';
1701                         $sSQL .= " AND postcode = '".pg_escape_string($aSearch['sPostcode'])."'";
1702                         if (CONST_Debug) var_dump($sSQL);
1703                         $aFilteredPlaceIDs = chksql($this->oDB->getCol($sSQL));
1704                         if ($aFilteredPlaceIDs) {
1705                             $aPlaceIDs = $aFilteredPlaceIDs;
1706                             if (CONST_Debug) {
1707                                 echo "<br><b>Place IDs after postcode filtering:</b> ";
1708                                 var_Dump($aPlaceIDs);
1709                             }
1710                         }
1711                     }
1712
1713                     foreach ($aPlaceIDs as $iPlaceID) {
1714                         // array for placeID => -1 | Tiger housenumber
1715                         $aResultPlaceIDs[$iPlaceID] = $searchedHousenumber;
1716                     }
1717                     if ($iQueryLoop > 20) break;
1718                 }
1719
1720                 if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs) && ($this->iMinAddressRank != 0 || $this->iMaxAddressRank != 30)) {
1721                     // Need to verify passes rank limits before dropping out of the loop (yuk!)
1722                     // reduces the number of place ids, like a filter
1723                     // rank_address is 30 for interpolated housenumbers
1724                     $sWherePlaceId = 'WHERE place_id in (';
1725                     $sWherePlaceId .= join(',', array_keys($aResultPlaceIDs)).') ';
1726
1727                     $sSQL = "SELECT place_id ";
1728                     $sSQL .= "FROM placex ".$sWherePlaceId;
1729                     $sSQL .= "  AND (";
1730                     $sSQL .= "         placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
1731                     if (14 >= $this->iMinAddressRank && 14 <= $this->iMaxAddressRank) {
1732                         $sSQL .= "     OR (extratags->'place') = 'city'";
1733                     }
1734                     if ($this->aAddressRankList) {
1735                         $sSQL .= "     OR placex.rank_address in (".join(',', $this->aAddressRankList).")";
1736                     }
1737                     $sSQL .= "  ) UNION ";
1738                     $sSQL .= " SELECT place_id FROM location_postcode lp ".$sWherePlaceId;
1739                     $sSQL .= "  AND (lp.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
1740                     if ($this->aAddressRankList) {
1741                         $sSQL .= "     OR lp.rank_address in (".join(',', $this->aAddressRankList).")";
1742                     }
1743                     $sSQL .= ") ";
1744                     if (CONST_Use_US_Tiger_Data && $this->iMaxAddressRank == 30) {
1745                         $sSQL .= "UNION ";
1746                         $sSQL .= "  SELECT place_id ";
1747                         $sSQL .= "  FROM location_property_tiger ".$sWherePlaceId;
1748                     }
1749                     if ($this->iMaxAddressRank == 30) {
1750                         $sSQL .= "UNION ";
1751                         $sSQL .= "  SELECT place_id ";
1752                         $sSQL .= "  FROM location_property_osmline ".$sWherePlaceId;
1753                     }
1754                     if (CONST_Debug) var_dump($sSQL);
1755                     $aFilteredPlaceIDs = chksql($this->oDB->getCol($sSQL));
1756                     $tempIDs = array();
1757                     foreach ($aFilteredPlaceIDs as $placeID) {
1758                         $tempIDs[$placeID] = $aResultPlaceIDs[$placeID];  //assign housenumber to placeID
1759                     }
1760                     $aResultPlaceIDs = $tempIDs;
1761                 }
1762
1763                 //exit;
1764                 if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs)) break;
1765                 if ($iGroupLoop > 4) break;
1766                 if ($iQueryLoop > 30) break;
1767             }
1768
1769             // Did we find anything?
1770             if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs)) {
1771                 $aSearchResults = $this->getDetails($aResultPlaceIDs);
1772             }
1773         } else {
1774             // Just interpret as a reverse geocode
1775             $oReverse = new ReverseGeocode($this->oDB);
1776             $oReverse->setZoom(18);
1777
1778             $aLookup = $oReverse->lookup(
1779                 $oNearPoint->lat(),
1780                 $oNearPoint->lon(),
1781                 false
1782             );
1783
1784             if (CONST_Debug) var_dump("Reverse search", $aLookup);
1785
1786             if ($aLookup['place_id']) {
1787                 $aSearchResults = $this->getDetails(array($aLookup['place_id'] => -1));
1788                 $aResultPlaceIDs[$aLookup['place_id']] = -1;
1789             } else {
1790                 $aSearchResults = array();
1791             }
1792         }
1793
1794         // No results? Done
1795         if (!sizeof($aSearchResults)) {
1796             if ($this->bFallback) {
1797                 if ($this->fallbackStructuredQuery()) {
1798                     return $this->lookup();
1799                 }
1800             }
1801
1802             return array();
1803         }
1804
1805         $aClassType = getClassTypesWithImportance();
1806         $aRecheckWords = preg_split('/\b[\s,\\-]*/u', $sQuery);
1807         foreach ($aRecheckWords as $i => $sWord) {
1808             if (!preg_match('/[\pL\pN]/', $sWord)) unset($aRecheckWords[$i]);
1809         }
1810
1811         if (CONST_Debug) {
1812             echo '<i>Recheck words:<\i>';
1813             var_dump($aRecheckWords);
1814         }
1815
1816         $oPlaceLookup = new PlaceLookup($this->oDB);
1817         $oPlaceLookup->setIncludePolygonAsPoints($this->bIncludePolygonAsPoints);
1818         $oPlaceLookup->setIncludePolygonAsText($this->bIncludePolygonAsText);
1819         $oPlaceLookup->setIncludePolygonAsGeoJSON($this->bIncludePolygonAsGeoJSON);
1820         $oPlaceLookup->setIncludePolygonAsKML($this->bIncludePolygonAsKML);
1821         $oPlaceLookup->setIncludePolygonAsSVG($this->bIncludePolygonAsSVG);
1822         $oPlaceLookup->setPolygonSimplificationThreshold($this->fPolygonSimplificationThreshold);
1823
1824         foreach ($aSearchResults as $iResNum => $aResult) {
1825             // Default
1826             $fDiameter = getResultDiameter($aResult);
1827
1828             $aOutlineResult = $oPlaceLookup->getOutlines($aResult['place_id'], $aResult['lon'], $aResult['lat'], $fDiameter/2);
1829             if ($aOutlineResult) {
1830                 $aResult = array_merge($aResult, $aOutlineResult);
1831             }
1832             
1833             if ($aResult['extra_place'] == 'city') {
1834                 $aResult['class'] = 'place';
1835                 $aResult['type'] = 'city';
1836                 $aResult['rank_search'] = 16;
1837             }
1838
1839             // Is there an icon set for this type of result?
1840             if (isset($aClassType[$aResult['class'].':'.$aResult['type']]['icon'])
1841                 && $aClassType[$aResult['class'].':'.$aResult['type']]['icon']
1842             ) {
1843                 $aResult['icon'] = CONST_Website_BaseURL.'images/mapicons/'.$aClassType[$aResult['class'].':'.$aResult['type']]['icon'].'.p.20.png';
1844             }
1845
1846             if (isset($aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label'])
1847                 && $aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label']
1848             ) {
1849                 $aResult['label'] = $aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label'];
1850             } elseif (isset($aClassType[$aResult['class'].':'.$aResult['type']]['label'])
1851                 && $aClassType[$aResult['class'].':'.$aResult['type']]['label']
1852             ) {
1853                 $aResult['label'] = $aClassType[$aResult['class'].':'.$aResult['type']]['label'];
1854             }
1855             // if tag '&addressdetails=1' is set in query
1856             if ($this->bIncludeAddressDetails) {
1857                 // getAddressDetails() is defined in lib.php and uses the SQL function get_addressdata in functions.sql
1858                 $aResult['address'] = getAddressDetails($this->oDB, $sLanguagePrefArraySQL, $aResult['place_id'], $aResult['country_code'], $aResultPlaceIDs[$aResult['place_id']]);
1859                 if ($aResult['extra_place'] == 'city' && !isset($aResult['address']['city'])) {
1860                     $aResult['address'] = array_merge(array('city' => array_values($aResult['address'])[0]), $aResult['address']);
1861                 }
1862             }
1863
1864             if ($this->bIncludeExtraTags) {
1865                 if ($aResult['extra']) {
1866                     $aResult['sExtraTags'] = json_decode($aResult['extra']);
1867                 } else {
1868                     $aResult['sExtraTags'] = (object) array();
1869                 }
1870             }
1871
1872             if ($this->bIncludeNameDetails) {
1873                 if ($aResult['names']) {
1874                     $aResult['sNameDetails'] = json_decode($aResult['names']);
1875                 } else {
1876                     $aResult['sNameDetails'] = (object) array();
1877                 }
1878             }
1879
1880             // Adjust importance for the number of exact string matches in the result
1881             $aResult['importance'] = max(0.001, $aResult['importance']);
1882             $iCountWords = 0;
1883             $sAddress = $aResult['langaddress'];
1884             foreach ($aRecheckWords as $i => $sWord) {
1885                 if (stripos($sAddress, $sWord)!==false) {
1886                     $iCountWords++;
1887                     if (preg_match("/(^|,)\s*".preg_quote($sWord, '/')."\s*(,|$)/", $sAddress)) $iCountWords += 0.1;
1888                 }
1889             }
1890
1891             $aResult['importance'] = $aResult['importance'] + ($iCountWords*0.1); // 0.1 is a completely arbitrary number but something in the range 0.1 to 0.5 would seem right
1892
1893             $aResult['name'] = $aResult['langaddress'];
1894             // secondary ordering (for results with same importance (the smaller the better):
1895             // - approximate importance of address parts
1896             $aResult['foundorder'] = -$aResult['addressimportance']/10;
1897             // - number of exact matches from the query
1898             if (isset($this->exactMatchCache[$aResult['place_id']])) {
1899                 $aResult['foundorder'] -= $this->exactMatchCache[$aResult['place_id']];
1900             } elseif (isset($this->exactMatchCache[$aResult['parent_place_id']])) {
1901                 $aResult['foundorder'] -= $this->exactMatchCache[$aResult['parent_place_id']];
1902             }
1903             // - importance of the class/type
1904             if (isset($aClassType[$aResult['class'].':'.$aResult['type']]['importance'])
1905                 && $aClassType[$aResult['class'].':'.$aResult['type']]['importance']
1906             ) {
1907                 $aResult['foundorder'] += 0.0001 * $aClassType[$aResult['class'].':'.$aResult['type']]['importance'];
1908             } else {
1909                 $aResult['foundorder'] += 0.01;
1910             }
1911             if (CONST_Debug) var_dump($aResult);
1912             $aSearchResults[$iResNum] = $aResult;
1913         }
1914         uasort($aSearchResults, 'byImportance');
1915
1916         $aOSMIDDone = array();
1917         $aClassTypeNameDone = array();
1918         $aToFilter = $aSearchResults;
1919         $aSearchResults = array();
1920
1921         $bFirst = true;
1922         foreach ($aToFilter as $iResNum => $aResult) {
1923             $this->aExcludePlaceIDs[$aResult['place_id']] = $aResult['place_id'];
1924             if ($bFirst) {
1925                 $fLat = $aResult['lat'];
1926                 $fLon = $aResult['lon'];
1927                 if (isset($aResult['zoom'])) $iZoom = $aResult['zoom'];
1928                 $bFirst = false;
1929             }
1930             if (!$this->bDeDupe || (!isset($aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']])
1931                 && !isset($aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']]))
1932             ) {
1933                 $aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']] = true;
1934                 $aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']] = true;
1935                 $aSearchResults[] = $aResult;
1936             }
1937
1938             // Absolute limit on number of results
1939             if (sizeof($aSearchResults) >= $this->iFinalLimit) break;
1940         }
1941
1942         return $aSearchResults;
1943     } // end lookup()
1944 } // end class