git.openstreetmap.org Git - nominatim.git/blob - lib/Geocode.php
Merge pull request #420 from lonvia/remove-explicit-software-versions
[nominatim.git] / lib / Geocode.php
1 <?php
2         require_once(CONST_BasePath.'/lib/PlaceLookup.php');
3
4         class Geocode
5         {
6                 protected $oDB;
7
8                 protected $aLangPrefOrder = array();
9
10                 protected $bIncludeAddressDetails = false;
11                 protected $bIncludeExtraTags = false;
12                 protected $bIncludeNameDetails = false;
13
14                 protected $bIncludePolygonAsPoints = false;
15                 protected $bIncludePolygonAsText = false;
16                 protected $bIncludePolygonAsGeoJSON = false;
17                 protected $bIncludePolygonAsKML = false;
18                 protected $bIncludePolygonAsSVG = false;
19                 protected $fPolygonSimplificationThreshold = 0.0;
20
21                 protected $aExcludePlaceIDs = array();
22                 protected $bDeDupe = true;
23                 protected $bReverseInPlan = false;
24
25                 protected $iLimit = 20;
26                 protected $iFinalLimit = 10;
27                 protected $iOffset = 0;
28                 protected $bFallback = false;
29
30                 protected $aCountryCodes = false;
31                 protected $aNearPoint = false;
32
33                 protected $bBoundedSearch = false;
34                 protected $aViewBox = false;
35                 protected $sViewboxSmallSQL = false;
36                 protected $sViewboxLargeSQL = false;
37                 protected $aRoutePoints = false;
38
39                 protected $iMaxRank = 20;
40                 protected $iMinAddressRank = 0;
41                 protected $iMaxAddressRank = 30;
42                 protected $aAddressRankList = array();
43                 protected $exactMatchCache = array();
44
45                 protected $sAllowedTypesSQLList = false;
46
47                 protected $sQuery = false;
48                 protected $aStructuredQuery = false;
49
/**
 * Create a geocoder bound to a database handle.
 *
 * PHP 8 no longer treats a method named after its class as the constructor,
 * so the initialisation lives in __construct(). Geocode() is kept below as an
 * ordinary method for code that still calls it by name.
 *
 * @param object $oDB Database handle; stored by reference in $this->oDB.
 */
function __construct(&$oDB)
{
    $this->oDB =& $oDB;
}

/**
 * Legacy PHP 4 style constructor name, kept for backward compatibility.
 *
 * @param object $oDB Database handle; stored by reference in $this->oDB.
 */
function Geocode(&$oDB)
{
    $this->__construct($oDB);
}
54
/**
 * Store the "reverse in plan" flag in $this->bReverseInPlan.
 *
 * @param mixed $bReverse New flag value; stored as given, without a boolean cast.
 */
function setReverseInPlan($bReverse)
{
    $this->bReverseInPlan = $bReverse;
}
59
/**
 * Replace the language preference list held in $this->aLangPrefOrder.
 *
 * @param array $aLangPref Language preference list; stored unchanged.
 */
function setLanguagePreference($aLangPref)
{
    $this->aLangPrefOrder = $aLangPref;
}
64
/**
 * Switch the address-details flag on or off.
 *
 * @param mixed $bAddressDetails Any value; reduced to a boolean before storing.
 */
function setIncludeAddressDetails($bAddressDetails = true)
{
    $bEnabled = (bool)$bAddressDetails;
    $this->bIncludeAddressDetails = $bEnabled;
}
69
/**
 * Report the current address-details flag.
 *
 * @return bool Value of $this->bIncludeAddressDetails.
 */
function getIncludeAddressDetails()
{
    $bIncluded = $this->bIncludeAddressDetails;
    return $bIncluded;
}
74
/**
 * Report the current extra-tags flag.
 *
 * @return bool Value of $this->bIncludeExtraTags.
 */
function getIncludeExtraTags()
{
    $bIncluded = $this->bIncludeExtraTags;
    return $bIncluded;
}
79
/**
 * Report the current name-details flag.
 *
 * @return bool Value of $this->bIncludeNameDetails.
 */
function getIncludeNameDetails()
{
    $bIncluded = $this->bIncludeNameDetails;
    return $bIncluded;
}
84
/**
 * Set the "polygon as points" output flag.
 *
 * @param mixed $b New flag value; stored as given, without a boolean cast.
 */
function setIncludePolygonAsPoints($b = true)
{
    $this->bIncludePolygonAsPoints = $b;
}
89
/**
 * Report the "polygon as points" output flag.
 *
 * @return mixed Value of $this->bIncludePolygonAsPoints.
 */
function getIncludePolygonAsPoints()
{
    $bIncluded = $this->bIncludePolygonAsPoints;
    return $bIncluded;
}
94
/**
 * Set the "polygon as text" output flag.
 *
 * @param mixed $b New flag value; stored as given, without a boolean cast.
 */
function setIncludePolygonAsText($b = true)
{
    $this->bIncludePolygonAsText = $b;
}
99
/**
 * Report the "polygon as text" output flag.
 *
 * @return mixed Value of $this->bIncludePolygonAsText.
 */
function getIncludePolygonAsText()
{
    $bIncluded = $this->bIncludePolygonAsText;
    return $bIncluded;
}
104
/**
 * Set the "polygon as GeoJSON" output flag.
 *
 * @param mixed $b New flag value; stored as given, without a boolean cast.
 */
function setIncludePolygonAsGeoJSON($b = true)
{
    $this->bIncludePolygonAsGeoJSON = $b;
}
109
/**
 * Set the "polygon as KML" output flag.
 *
 * @param mixed $b New flag value; stored as given, without a boolean cast.
 */
function setIncludePolygonAsKML($b = true)
{
    $this->bIncludePolygonAsKML = $b;
}
114
/**
 * Set the "polygon as SVG" output flag.
 *
 * @param mixed $b New flag value; stored as given, without a boolean cast.
 */
function setIncludePolygonAsSVG($b = true)
{
    $this->bIncludePolygonAsSVG = $b;
}
119
/**
 * Store the polygon simplification threshold.
 *
 * @param mixed $f Threshold value; stored as given, without a float cast.
 */
function setPolygonSimplificationThreshold($f)
{
    $this->fPolygonSimplificationThreshold = $f;
}
124
/**
 * Switch the de-duplication flag on or off.
 *
 * @param mixed $bDeDupe Any value; reduced to a boolean before storing.
 */
function setDeDupe($bDeDupe = true)
{
    $bEnabled = (bool)$bDeDupe;
    $this->bDeDupe = $bEnabled;
}
129
/**
 * Set the number of results to return.
 *
 * The requested value is clamped to the range 1..50 and stored as the final
 * limit. The internal limit ($this->iLimit) is the final limit plus a margin
 * of at most 10, the margin being min(final limit, 10).
 *
 * @param int $iLimit Requested number of results.
 */
function setLimit($iLimit = 10)
{
    if ($iLimit > 50)
    {
        $iLimit = 50;
    }
    elseif ($iLimit < 1)
    {
        $iLimit = 1;
    }

    $this->iFinalLimit = $iLimit;

    $iMargin = min($this->iFinalLimit, 10);
    $this->iLimit = $this->iFinalLimit + $iMargin;
}
138
/**
 * Store the result offset in $this->iOffset.
 *
 * @param mixed $iOffset Offset value; stored as given, without an integer cast.
 */
function setOffset($iOffset = 0)
{
    $this->iOffset = $iOffset;
}
143
/**
 * Switch the fallback flag on or off.
 *
 * @param mixed $bFallback Any value; reduced to a boolean before storing.
 */
function setFallback($bFallback = true)
{
    $bEnabled = (bool)$bFallback;
    $this->bFallback = $bEnabled;
}
148
/**
 * Replace the list of place IDs to exclude.
 *
 * Every entry is forced to an integer and entries that evaluate to 0 are
 * dropped, which is the same filtering loadParamArray() applies to the
 * 'exclude_place_ids' request parameter. Array keys are preserved.
 *
 * @param array $a Place IDs to exclude.
 */
function setExcludedPlaceIDs($a)
{
    $aCleanPlaceIDs = array();
    foreach ((array)$a as $mKey => $mPlaceID)
    {
        $iPlaceID = (int)$mPlaceID;
        if ($iPlaceID) $aCleanPlaceIDs[$mKey] = $iPlaceID;
    }
    $this->aExcludePlaceIDs = $aCleanPlaceIDs;
}
154
/**
 * Return the list of excluded place IDs.
 *
 * @return array Value of $this->aExcludePlaceIDs.
 */
function getExcludedPlaceIDs()
{
    $aExcluded = $this->aExcludePlaceIDs;
    return $aExcluded;
}
159
/**
 * Switch the bounded-search flag on or off.
 *
 * @param mixed $bBoundedSearch Any value; reduced to a boolean before storing.
 */
function setBounded($bBoundedSearch = true)
{
    $bEnabled = (bool)$bBoundedSearch;
    $this->bBoundedSearch = $bEnabled;
}
164
/**
 * Store the view box as a four-element list: left, bottom, right, top.
 *
 * The values are stored as given, without any numeric cast.
 *
 * @param mixed $fLeft   Left edge.
 * @param mixed $fBottom Bottom edge.
 * @param mixed $fRight  Right edge.
 * @param mixed $fTop    Top edge.
 */
function setViewBox($fLeft, $fBottom, $fRight, $fTop)
{
    $aBox = array();
    $aBox[] = $fLeft;
    $aBox[] = $fBottom;
    $aBox[] = $fRight;
    $aBox[] = $fTop;
    $this->aViewBox = $aBox;
}
169
/**
 * Format the view box as a comma-separated string.
 *
 * The stored order is left, bottom, right, top; the string is emitted as
 * left, top, right, bottom.
 *
 * @return string|null The formatted view box, or null when none is set.
 */
function getViewBoxString()
{
    if (!$this->aViewBox) return null;

    $aBox = $this->aViewBox;
    return join(',', array($aBox[0], $aBox[3], $aBox[2], $aBox[1]));
}
175
/**
 * Replace the route point list held in $this->aRoutePoints.
 *
 * @param mixed $aRoutePoints Route points; stored unchanged.
 */
function setRoute($aRoutePoints)
{
    $this->aRoutePoints = $aRoutePoints;
}
180
/**
 * Restrict the address rank range according to a named feature type.
 *
 * Recognised names are 'country' (4-4), 'state' (8-8), 'city' (14-16) and
 * 'settlement' (8-20). Any other value leaves the rank range untouched.
 *
 * @param string $sFeatureType Feature type name.
 */
function setFeatureType($sFeatureType)
{
    $aRankRanges = array(
        'country'    => array(4, 4),
        'state'      => array(8, 8),
        'city'       => array(14, 16),
        'settlement' => array(8, 20),
    );

    foreach ($aRankRanges as $sName => $aRange)
    {
        // Loose comparison on purpose: it is what a switch statement does.
        if ($sFeatureType == $sName)
        {
            $this->setRankRange($aRange[0], $aRange[1]);
            break;
        }
    }
}
199
/**
 * Set the minimum and maximum address rank, both converted to integers.
 *
 * @param mixed $iMin Lowest address rank.
 * @param mixed $iMax Highest address rank.
 */
function setRankRange($iMin, $iMax)
{
    $iLowest = (int)$iMin;
    $iHighest = (int)$iMax;

    $this->iMinAddressRank = $iLowest;
    $this->iMaxAddressRank = $iHighest;
}
205
/**
 * Store a "near" point as a three-element list of floats.
 *
 * The stored list is element 0 of $aNearPoint, element 1 of $aNearPoint and
 * the radius, each cast to float.
 *
 * @param array $aNearPoint Two-element list holding the point's coordinates.
 * @param mixed $fRadiusDeg Radius around the point (named as degrees).
 */
function setNearPoint($aNearPoint, $fRadiusDeg = 0.1)
{
    $fFirst = (float)$aNearPoint[0];
    $fSecond = (float)$aNearPoint[1];
    $fRadius = (float)$fRadiusDeg;

    $this->aNearPoint = array($fFirst, $fSecond, $fRadius);
}
210
/**
 * Replace the country code list held in $this->aCountryCodes.
 *
 * @param mixed $aCountryCodes Country codes; stored unchanged.
 */
function setCountryCodesList($aCountryCodes)
{
    $this->aCountryCodes = $aCountryCodes;
}
215
/**
 * Set a free-text query and discard any structured query.
 *
 * @param mixed $sQueryString Query text; stored unchanged.
 */
function setQuery($sQueryString)
{
    // A free-text query replaces whatever structured query was set before.
    $this->aStructuredQuery = false;
    $this->sQuery = $sQueryString;
}
221
/**
 * Return the current query string.
 *
 * @return string|false Value of $this->sQuery; false until a query is set.
 */
function getQueryString()
{
    $sCurrentQuery = $this->sQuery;
    return $sCurrentQuery;
}
226
227
/**
 * Configure the geocoder from an associative array of request parameters.
 *
 * Only keys that are present are applied; everything else keeps its current
 * value. Recognised keys: addressdetails, extratags, namedetails, bounded,
 * dedupe, limit, offset, fallback, exclude_place_ids, featureType /
 * featuretype, countrycodes, viewboxlbrt, viewbox, route (with routewidth).
 *
 * A view box is only applied when it has at least four comma-separated
 * components; a shorter value is ignored instead of reading missing offsets.
 *
 * @param array $aParams Request parameters, keyed by parameter name.
 */
function loadParamArray($aParams)
{
    if (isset($aParams['addressdetails'])) $this->bIncludeAddressDetails = (bool)$aParams['addressdetails'];
    if (isset($aParams['extratags'])) $this->bIncludeExtraTags = (bool)$aParams['extratags'];
    if (isset($aParams['namedetails'])) $this->bIncludeNameDetails = (bool)$aParams['namedetails'];

    if (isset($aParams['bounded'])) $this->bBoundedSearch = (bool)$aParams['bounded'];
    if (isset($aParams['dedupe'])) $this->bDeDupe = (bool)$aParams['dedupe'];

    if (isset($aParams['limit'])) $this->setLimit((int)$aParams['limit']);
    if (isset($aParams['offset'])) $this->iOffset = (int)$aParams['offset'];

    if (isset($aParams['fallback'])) $this->bFallback = (bool)$aParams['fallback'];

    // List of excluded place IDs - used for more accurate paging
    if (isset($aParams['exclude_place_ids']) && $aParams['exclude_place_ids'])
    {
        $aExcludePlaceIDs = array();
        foreach (explode(',', $aParams['exclude_place_ids']) as $iExcludedPlaceID)
        {
            $iExcludedPlaceID = (int)$iExcludedPlaceID;
            if ($iExcludedPlaceID)
                $aExcludePlaceIDs[$iExcludedPlaceID] = $iExcludedPlaceID;
        }

        // Keep the existing list when the parameter held no usable ID.
        if ($aExcludePlaceIDs)
            $this->aExcludePlaceIDs = $aExcludePlaceIDs;
    }

    // Only certain ranks of feature
    if (isset($aParams['featureType'])) $this->setFeatureType($aParams['featureType']);
    if (isset($aParams['featuretype'])) $this->setFeatureType($aParams['featuretype']);

    // Country code list: keep two-letter codes only, lower-cased
    if (isset($aParams['countrycodes']))
    {
        $aCountryCodes = array();
        foreach (explode(',', $aParams['countrycodes']) as $sCountryCode)
        {
            if (preg_match('/^[a-zA-Z][a-zA-Z]$/', $sCountryCode))
            {
                $aCountryCodes[] = strtolower($sCountryCode);
            }
        }
        $this->aCountryCodes = $aCountryCodes;
    }

    // 'viewboxlbrt' is left,bottom,right,top; 'viewbox' is left,top,right,bottom.
    if (isset($aParams['viewboxlbrt']) && $aParams['viewboxlbrt'])
    {
        $aCoOrdinatesLBRT = explode(',', $aParams['viewboxlbrt']);
        if (sizeof($aCoOrdinatesLBRT) >= 4)
        {
            $this->setViewBox($aCoOrdinatesLBRT[0], $aCoOrdinatesLBRT[1], $aCoOrdinatesLBRT[2], $aCoOrdinatesLBRT[3]);
        }
    }
    else if (isset($aParams['viewbox']) && $aParams['viewbox'])
    {
        $aCoOrdinatesLTRB = explode(',', $aParams['viewbox']);
        if (sizeof($aCoOrdinatesLTRB) >= 4)
        {
            $this->setViewBox($aCoOrdinatesLTRB[0], $aCoOrdinatesLTRB[3], $aCoOrdinatesLTRB[2], $aCoOrdinatesLTRB[1]);
        }
    }

    // A route is only read when 'routewidth' is also given; the width itself is not used here.
    if (isset($aParams['route']) && $aParams['route'] && isset($aParams['routewidth']) && $aParams['routewidth'])
    {
        $aPoints = explode(',', $aParams['route']);
        if (sizeof($aPoints) % 2 != 0)
        {
            userError("Uneven number of points");
            exit;
        }
        $fPrevCoord = false;
        $aRoute = array();
        foreach ($aPoints as $i => $fPoint)
        {
            if ($i % 2)
            {
                // Odd index completes a pair: stored as (second value, first value).
                $aRoute[] = array((float)$fPoint, $fPrevCoord);
            }
            else
            {
                $fPrevCoord = (float)$fPoint;
            }
        }
        $this->aRoutePoints = $aRoute;
    }
}
309
/**
 * Pick the query from request parameters.
 *
 * A non-empty (after trimming) 'q' parameter is used as a free-text query.
 * Otherwise a structured query is built from the amenity, street, city,
 * county, state, country and postalcode parameters, and the reverse-in-plan
 * flag is switched off.
 *
 * @param array $aParams Request parameters, keyed by parameter name.
 */
function setQueryFromParams($aParams)
{
    $sFreeText = '';
    if (isset($aParams['q']))
    {
        $sFreeText = trim($aParams['q']);
    }

    if ($sFreeText)
    {
        $this->setQuery($sFreeText);
        return;
    }

    // No usable free-text query: fall back to the structured fields.
    $this->setStructuredQuery(
        @$aParams['amenity'],
        @$aParams['street'],
        @$aParams['city'],
        @$aParams['county'],
        @$aParams['state'],
        @$aParams['country'],
        @$aParams['postalcode']
    );
    $this->setReverseInPlan(false);
}
324
/**
 * Add one field of a structured query.
 *
 * The value is trimmed; a value that is empty (or otherwise falsy) after
 * trimming is ignored. The supplied rank range is only adopted while the
 * address rank range is still at 0..30, so the first field that is loaded
 * decides the range.
 *
 * @param string      $sValue             Field value.
 * @param string      $sKey               Field name used as key in the structured query.
 * @param int         $iNewMinAddressRank Minimum address rank for this field.
 * @param int         $iNewMaxAddressRank Maximum address rank for this field.
 * @param array|false $aItemListValues    Extra address ranks to append to the rank list, or false.
 *
 * @return bool True when the field was added, false when it was ignored.
 */
function loadStructuredAddressElement($sValue, $sKey, $iNewMinAddressRank, $iNewMaxAddressRank, $aItemListValues)
{
    $sTrimmed = trim($sValue);
    if (!$sTrimmed)
    {
        return false;
    }

    $this->aStructuredQuery[$sKey] = $sTrimmed;

    $bRangeUntouched = ($this->iMinAddressRank == 0 && $this->iMaxAddressRank == 30);
    if ($bRangeUntouched)
    {
        $this->iMinAddressRank = $iNewMinAddressRank;
        $this->iMaxAddressRank = $iNewMaxAddressRank;
    }

    if ($aItemListValues)
    {
        $this->aAddressRankList = array_merge($this->aAddressRankList, $aItemListValues);
    }

    return true;
}
338
/**
 * Build the query from structured address fields.
 *
 * Resets the query string, address rank range, address rank list, structured
 * query and allowed-types list, then loads each non-empty field. The first
 * field loaded fixes the address rank range. When at least one field was
 * given, the query string becomes the fields joined by ', ', and if the
 * resulting maximum address rank is below 30 the allowed place classes are
 * restricted to 'place' and 'boundary'.
 *
 * @param string|false $sAmentiy    Amenity.
 * @param string|false $sStreet     Street.
 * @param string|false $sCity       City.
 * @param string|false $sCounty     County.
 * @param string|false $sState      State.
 * @param string|false $sCountry    Country.
 * @param string|false $sPostalCode Postal code.
 */
function setStructuredQuery($sAmentiy = false, $sStreet = false, $sCity = false, $sCounty = false, $sState = false, $sCountry = false, $sPostalCode = false)
{
    $this->sQuery = false;

    // Reset
    $this->iMinAddressRank = 0;
    $this->iMaxAddressRank = 30;
    $this->aAddressRankList = array();

    $this->aStructuredQuery = array();
    $this->sAllowedTypesSQLList = '';

    // Load order matters: the first non-empty field sets the rank range.
    $this->loadStructuredAddressElement($sAmentiy, 'amenity', 26, 30, false);
    $this->loadStructuredAddressElement($sStreet, 'street', 26, 30, false);
    $this->loadStructuredAddressElement($sCity, 'city', 14, 24, false);
    $this->loadStructuredAddressElement($sCounty, 'county', 9, 13, false);
    $this->loadStructuredAddressElement($sState, 'state', 8, 8, false);
    $this->loadStructuredAddressElement($sPostalCode, 'postalcode' , 5, 11, array(5, 11));
    $this->loadStructuredAddressElement($sCountry, 'country', 4, 4, false);

    if (sizeof($this->aStructuredQuery) > 0)
    {
        $this->sQuery = join(', ', $this->aStructuredQuery);
        if ($this->iMaxAddressRank < 30)
        {
            // Must be stored on the object: getDetails() reads $this->sAllowedTypesSQLList.
            $this->sAllowedTypesSQLList = '(\'place\',\'boundary\')';
        }
    }
}
368
/**
 * Relax a structured query by dropping its most specific field.
 *
 * Fields are tried in the order postalcode, street, city, county, state; the
 * first one present is removed and the structured query is rebuilt from the
 * remaining fields. Nothing is done when there is no structured query, when
 * it has exactly one field, or when none of the listed fields is present.
 *
 * @return bool True when a field was dropped and the query rebuilt, false otherwise.
 */
function fallbackStructuredQuery()
{
    if (!$this->aStructuredQuery) return false;

    $aRemaining = $this->aStructuredQuery;
    if (sizeof($aRemaining) == 1) return false;

    $sDropped = false;
    foreach (array('postalcode', 'street', 'city', 'county', 'state') as $sCandidate)
    {
        if (isset($aRemaining[$sCandidate]))
        {
            $sDropped = $sCandidate;
            break;
        }
    }

    if ($sDropped === false) return false;

    unset($aRemaining[$sDropped]);
    $this->setStructuredQuery(
        @$aRemaining['amenity'],
        @$aRemaining['street'],
        @$aRemaining['city'],
        @$aRemaining['county'],
        @$aRemaining['state'],
        @$aRemaining['country'],
        @$aRemaining['postalcode']
    );
    return true;
}
391
/**
 * Fetch the display details for a set of places.
 *
 * Builds one SQL statement that selects from placex and, when address rank 30
 * lies inside the configured rank range, is unioned with selects from
 * location_property_tiger (interpolated house numbers) and
 * location_property_aux. Rows are ordered by importance, descending.
 *
 * @param array $aPlaceIDs Map of place ID => Tiger house number, or -1 when no
 *                         house number was found.
 *
 * @return array Result rows from the database; an empty array when
 *               $aPlaceIDs is empty. On a database error
 *               failInternalError() is called.
 */
function getDetails($aPlaceIDs)
{
    // $aPlaceIDs is an array with key: placeID and value: tiger-housenumber, if found, else -1
    if (!sizeof($aPlaceIDs)) return array();

    $aQuotedLanguages = array_map("getDBQuoted", $this->aLangPrefOrder);
    $sLanguagePrefArraySQL = "ARRAY[".join(',', $aQuotedLanguages)."]";

    // Get the details for display (is this a redundant extra step?)
    $sPlaceIDs = join(',', array_keys($aPlaceIDs));

    // Importance multiplier: each view box that is set contributes one factor.
    $sImportanceSQL = '';
    if ($this->sViewboxSmallSQL)
    {
        $sImportanceSQL .= " case when ST_Contains($this->sViewboxSmallSQL, ST_Collect(centroid)) THEN 1 ELSE 0.75 END * ";
    }
    if ($this->sViewboxLargeSQL)
    {
        $sImportanceSQL .= " case when ST_Contains($this->sViewboxLargeSQL, ST_Collect(centroid)) THEN 1 ELSE 0.75 END * ";
    }

    $bCityRankInRange = (14 >= $this->iMinAddressRank && 14 <= $this->iMaxAddressRank);
    $bHouseRankInRange = (30 >= $this->iMinAddressRank && 30 <= $this->iMaxAddressRank);

    // --- placex ---
    $sSQL = "select osm_type,osm_id,class,type,admin_level,rank_search,rank_address,min(place_id) as place_id, min(parent_place_id) as parent_place_id, calculated_country_code as country_code,";
    $sSQL .= "get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) as langaddress,";
    $sSQL .= "get_name_by_language(name, $sLanguagePrefArraySQL) as placename,";
    $sSQL .= "get_name_by_language(name, ARRAY['ref']) as ref,";
    if ($this->bIncludeExtraTags)
    {
        $sSQL .= "hstore_to_json(extratags)::text as extra,";
    }
    if ($this->bIncludeNameDetails)
    {
        $sSQL .= "hstore_to_json(name)::text as names,";
    }
    $sSQL .= "avg(ST_X(centroid)) as lon,avg(ST_Y(centroid)) as lat, ";
    $sSQL .= $sImportanceSQL."coalesce(importance,0.75-(rank_search::float/40)) as importance, ";
    $sSQL .= "(select max(p.importance*(p.rank_address+2)) from place_addressline s, placex p where s.place_id = min(CASE WHEN placex.rank_search < 28 THEN placex.place_id ELSE placex.parent_place_id END) and p.place_id = s.address_place_id and s.isaddress and p.importance is not null) as addressimportance, ";
    $sSQL .= "(extratags->'place') as extra_place ";
    $sSQL .= "from placex where place_id in ($sPlaceIDs) ";
    $sSQL .= "and (placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
    if ($bCityRankInRange)
    {
        $sSQL .= " OR (extratags->'place') = 'city'";
    }
    if ($this->aAddressRankList)
    {
        $sSQL .= " OR placex.rank_address in (".join(',', $this->aAddressRankList).")";
    }
    $sSQL .= ") ";
    if ($this->sAllowedTypesSQLList)
    {
        $sSQL .= "and placex.class in $this->sAllowedTypesSQLList ";
    }
    $sSQL .= "and linked_place_id is null ";
    $sSQL .= "group by osm_type,osm_id,class,type,admin_level,rank_search,rank_address,calculated_country_code,importance";
    if (!$this->bDeDupe)
    {
        $sSQL .= ",place_id";
    }
    $sSQL .= ",langaddress ";
    $sSQL .= ",placename ";
    $sSQL .= ",ref ";
    if ($this->bIncludeExtraTags)
    {
        $sSQL .= ",extratags";
    }
    if ($this->bIncludeNameDetails)
    {
        $sSQL .= ",name";
    }
    $sSQL .= ",extratags->'place' ";

    if ($bHouseRankInRange)
    {
        // Query also location_property_tiger and location_property_aux.
        // Tiger search only if a housenumber was searched and if it was found
        // (i.e. aPlaceIDs[placeID] = housenumber != -1) (realized through a join).
        // Only Tiger housenumbers need to be interpolated, because they are saved
        // as lines with start- and endnumber; the common osm housenumbers are
        // usually saved as points.
        $aHousenumberRows = array();
        foreach ($aPlaceIDs as $iPlaceID => $iHousenumber)
        {
            $aHousenumberRows[] = "(".$iPlaceID.", ".$iHousenumber.")";
        }
        $sHousenumberValues = join(", ", $aHousenumberRows);

        // --- location_property_tiger ---
        $sSQL .= "union ";
        $sSQL .= "select 'T' as osm_type, place_id as osm_id, 'place' as class, 'house' as type, null as admin_level, 30 as rank_search, 30 as rank_address, min(place_id) as place_id, min(parent_place_id) as parent_place_id, 'us' as country_code";
        $sSQL .= ", get_address_by_language(place_id, housenumber_for_place, $sLanguagePrefArraySQL) as langaddress ";
        $sSQL .= ", null as placename";
        $sSQL .= ", null as ref";
        if ($this->bIncludeExtraTags)
        {
            $sSQL .= ", null as extra";
        }
        if ($this->bIncludeNameDetails)
        {
            $sSQL .= ", null as names";
        }
        $sSQL .= ", avg(st_x(centroid)) as lon, avg(st_y(centroid)) as lat,";
        $sSQL .= $sImportanceSQL."-1.15 as importance ";
        $sSQL .= ", (select max(p.importance*(p.rank_address+2)) from place_addressline s, placex p where s.place_id = min(blub.parent_place_id) and p.place_id = s.address_place_id and s.isaddress and p.importance is not null) as addressimportance ";
        $sSQL .= ", null as extra_place ";
        $sSQL .= " from (select place_id";
        // interpolate the Tiger housenumbers here
        $sSQL .= ", ST_LineInterpolatePoint(linegeo, (housenumber_for_place-startnumber::float)/(endnumber-startnumber)::float) as centroid, parent_place_id, housenumber_for_place ";
        $sSQL .= "from (location_property_tiger ";
        $sSQL .= " join (values ".$sHousenumberValues.") as housenumbers(place_id, housenumber_for_place) using(place_id)) ";
        // postgres wants an alias here
        $sSQL .= " where housenumber_for_place>=0 and 30 between $this->iMinAddressRank and $this->iMaxAddressRank) as blub";
        // is this group by really needed?, place_id + housenumber (in combination) are unique
        $sSQL .= " group by place_id, housenumber_for_place";
        if (!$this->bDeDupe)
        {
            $sSQL .= ", place_id ";
        }

        // --- location_property_aux ---
        $sSQL .= " union ";
        $sSQL .= "select 'L' as osm_type, place_id as osm_id, 'place' as class, 'house' as type, null as admin_level, 0 as rank_search, 0 as rank_address, min(place_id) as place_id, min(parent_place_id) as parent_place_id, 'us' as country_code, ";
        $sSQL .= "get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) as langaddress, ";
        $sSQL .= "null as placename, ";
        $sSQL .= "null as ref, ";
        if ($this->bIncludeExtraTags)
        {
            $sSQL .= "null as extra, ";
        }
        if ($this->bIncludeNameDetails)
        {
            $sSQL .= "null as names, ";
        }
        $sSQL .= "avg(ST_X(centroid)) as lon, avg(ST_Y(centroid)) as lat, ";
        $sSQL .= $sImportanceSQL."-1.10 as importance, ";
        $sSQL .= "(select max(p.importance*(p.rank_address+2)) from place_addressline s, placex p where s.place_id = min(location_property_aux.parent_place_id) and p.place_id = s.address_place_id and s.isaddress and p.importance is not null) as addressimportance, ";
        $sSQL .= "null as extra_place ";
        $sSQL .= "from location_property_aux where place_id in ($sPlaceIDs) ";
        $sSQL .= "and 30 between $this->iMinAddressRank and $this->iMaxAddressRank ";
        $sSQL .= "group by place_id";
        if (!$this->bDeDupe)
        {
            $sSQL .= ", place_id";
        }
        $sSQL .= ", get_address_by_language(place_id, -1, $sLanguagePrefArraySQL) ";
    }

    $sSQL .= " order by importance desc";
    if (CONST_Debug)
    {
        echo "<hr>";
        var_dump($sSQL);
    }

    $aSearchResults = $this->oDB->getAll($sSQL);
    if (PEAR::IsError($aSearchResults))
    {
        failInternalError("Could not get details for place.", $sSQL, $aSearchResults);
    }

    return $aSearchResults;
}
497
498                 function getGroupedSearches($aSearches, $aPhraseTypes, $aPhrases, $aValidTokens, $aWordFrequencyScores, $bStructuredPhrases)
499                 {
500                         /*
501                                  Calculate all searches using aValidTokens i.e.
502                                  'Wodsworth Road, Sheffield' =>
503
504                                  Phrase Wordset
505                                  0      0       (wodsworth road)
506                                  0      1       (wodsworth)(road)
507                                  1      0       (sheffield)
508
509                                  Score how good the search is so they can be ordered
510                          */
511                         foreach($aPhrases as $iPhrase => $sPhrase)
512                         {
513                                 $aNewPhraseSearches = array();
514                                 if ($bStructuredPhrases) $sPhraseType = $aPhraseTypes[$iPhrase];
515                                 else $sPhraseType = '';
516
517                                 foreach($aPhrases[$iPhrase]['wordsets'] as $iWordSet => $aWordset)
518                                 {
519                                         // Too many permutations - too expensive
520                                         if ($iWordSet > 120) break;
521
522                                         $aWordsetSearches = $aSearches;
523
524                                         // Add all words from this wordset
525                                         foreach($aWordset as $iToken => $sToken)
526                                         {
527                                                 //echo "<br><b>$sToken</b>";
528                                                 $aNewWordsetSearches = array();
529
530                                                 foreach($aWordsetSearches as $aCurrentSearch)
531                                                 {
532                                                         //echo "<i>";
533                                                         //var_dump($aCurrentSearch);
534                                                         //echo "</i>";
535
536                                                         // If the token is valid
537                                                         if (isset($aValidTokens[' '.$sToken]))
538                                                         {
539                                                                 foreach($aValidTokens[' '.$sToken] as $aSearchTerm)
540                                                                 {
541                                                                         $aSearch = $aCurrentSearch;
542                                                                         $aSearch['iSearchRank']++;
543                                                                         if (($sPhraseType == '' || $sPhraseType == 'country') && !empty($aSearchTerm['country_code']) && $aSearchTerm['country_code'] != '0')
544                                                                         {
545                                                                                 if ($aSearch['sCountryCode'] === false)
546                                                                                 {
547                                                                                         $aSearch['sCountryCode'] = strtolower($aSearchTerm['country_code']);
548                                                                                         // Country is almost always at the end of the string - increase score for finding it anywhere else (optimisation)
549                                                                                         if (($iToken+1 != sizeof($aWordset) || $iPhrase+1 != sizeof($aPhrases)))
550                                                                                         {
551                                                                                                 $aSearch['iSearchRank'] += 5;
552                                                                                         }
553                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
554                                                                                 }
555                                                                         }
556                                                                         elseif (isset($aSearchTerm['lat']) && $aSearchTerm['lat'] !== '' && $aSearchTerm['lat'] !== null)
557                                                                         {
558                                                                                 if ($aSearch['fLat'] === '')
559                                                                                 {
560                                                                                         $aSearch['fLat'] = $aSearchTerm['lat'];
561                                                                                         $aSearch['fLon'] = $aSearchTerm['lon'];
562                                                                                         $aSearch['fRadius'] = $aSearchTerm['radius'];
563                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
564                                                                                 }
565                                                                         }
566                                                                         elseif ($sPhraseType == 'postalcode')
567                                                                         {
568                                                                                 // We need to try the case where the postal code is the primary element (i.e. there is no way to tell if it is (postalcode, city) OR (city, postalcode)), so try both
569                                                                                 if (isset($aSearchTerm['word_id']) && $aSearchTerm['word_id'])
570                                                                                 {
571                                                                                         // If we already have a name try putting the postcode first
572                                                                                         if (sizeof($aSearch['aName']))
573                                                                                         {
574                                                                                                 $aNewSearch = $aSearch;
575                                                                                                 $aNewSearch['aAddress'] = array_merge($aNewSearch['aAddress'], $aNewSearch['aName']);
576                                                                                                 $aNewSearch['aName'] = array();
577                                                                                                 $aNewSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
578                                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aNewSearch;
579                                                                                         }
580
581                                                                                         if (sizeof($aSearch['aName']))
582                                                                                         {
583                                                                                                 if ((!$bStructuredPhrases || $iPhrase > 0) && $sPhraseType != 'country' && (!isset($aValidTokens[$sToken]) || strpos($sToken, ' ') !== false))
584                                                                                                 {
585                                                                                                         $aSearch['aAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
586                                                                                                 }
587                                                                                                 else
588                                                                                                 {
589                                                                                                         $aCurrentSearch['aFullNameAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
590                                                                                                         $aSearch['iSearchRank'] += 1000; // skip;
591                                                                                                 }
592                                                                                         }
593                                                                                         else
594                                                                                         {
595                                                                                                 $aSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
596                                                                                                 //$aSearch['iNamePhrase'] = $iPhrase;
597                                                                                         }
598                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
599                                                                                 }
600
601                                                                         }
602                                                                         elseif (($sPhraseType == '' || $sPhraseType == 'street') && $aSearchTerm['class'] == 'place' && $aSearchTerm['type'] == 'house')
603                                                                         {
604                                                                                 if ($aSearch['sHouseNumber'] === '')
605                                                                                 {
606                                                                                         $aSearch['sHouseNumber'] = $sToken;
607                                                                                         // sanity check: if the housenumber is not mainly made
608                                                                                         // up of numbers, add a penalty
609                                                                                         if (preg_match_all("/[^0-9]/", $sToken, $aMatches) > 2) $aSearch['iSearchRank']++;
610                                                                                         // also housenumbers should appear in the first or second phrase
611                                                                                         if ($iPhrase > 1) $aSearch['iSearchRank'] += 1;
612                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
613                                                                                         /*
614                                                                                         // Fall back to not searching for this item (better than nothing)
615                                                                                         $aSearch = $aCurrentSearch;
616                                                                                         $aSearch['iSearchRank'] += 1;
617                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
618                                                                                          */
619                                                                                 }
620                                                                         }
621                                                                         elseif ($sPhraseType == '' && $aSearchTerm['class'] !== '' && $aSearchTerm['class'] !== null)
622                                                                         {
623                                                                                 if ($aSearch['sClass'] === '')
624                                                                                 {
625                                                                                         $aSearch['sOperator'] = $aSearchTerm['operator'];
626                                                                                         $aSearch['sClass'] = $aSearchTerm['class'];
627                                                                                         $aSearch['sType'] = $aSearchTerm['type'];
628                                                                                         if (sizeof($aSearch['aName'])) $aSearch['sOperator'] = 'name';
629                                                                                         else $aSearch['sOperator'] = 'near'; // near = in for the moment
630                                                                                         if (strlen($aSearchTerm['operator']) == 0) $aSearch['iSearchRank'] += 1;
631
632                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
633                                                                                 }
634                                                                         }
635                                                                         elseif (isset($aSearchTerm['word_id']) && $aSearchTerm['word_id'])
636                                                                         {
637                                                                                 if (sizeof($aSearch['aName']))
638                                                                                 {
639                                                                                         if ((!$bStructuredPhrases || $iPhrase > 0) && $sPhraseType != 'country' && (!isset($aValidTokens[$sToken]) || strpos($sToken, ' ') !== false))
640                                                                                         {
641                                                                                                 $aSearch['aAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
642                                                                                         }
643                                                                                         else
644                                                                                         {
645                                                                                                 $aCurrentSearch['aFullNameAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
646                                                                                                 $aSearch['iSearchRank'] += 1000; // skip;
647                                                                                         }
648                                                                                 }
649                                                                                 else
650                                                                                 {
651                                                                                         $aSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
652                                                                                         //$aSearch['iNamePhrase'] = $iPhrase;
653                                                                                 }
654                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
655                                                                         }
656                                                                 }
657                                                         }
658                                                         // Look for partial matches.
659                                                         // Note that there is no point in adding country terms here
660                                                         // because countries are omitted in the address.
661                                                         if (isset($aValidTokens[$sToken]) && $sPhraseType != 'country')
662                                                         {
663                                                                 // Allow searching for a word - but at extra cost
664                                                                 foreach($aValidTokens[$sToken] as $aSearchTerm)
665                                                                 {
666                                                                         if (isset($aSearchTerm['word_id']) && $aSearchTerm['word_id'])
667                                                                         {
668                                                                                 if ((!$bStructuredPhrases || $iPhrase > 0) && sizeof($aCurrentSearch['aName']) && strpos($sToken, ' ') === false)
669                                                                                 {
670                                                                                         $aSearch = $aCurrentSearch;
671                                                                                         $aSearch['iSearchRank'] += 1;
672                                                                                         if ($aWordFrequencyScores[$aSearchTerm['word_id']] < CONST_Max_Word_Frequency)
673                                                                                         {
674                                                                                                 $aSearch['aAddress'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
675                                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
676                                                                                         }
677                                                                                         elseif (isset($aValidTokens[' '.$sToken])) // revert to the token version?
678                                                                                         {
679                                                                                                 $aSearch['aAddressNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
680                                                                                                 $aSearch['iSearchRank'] += 1;
681                                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
682                                                                                                 foreach($aValidTokens[' '.$sToken] as $aSearchTermToken)
683                                                                                                 {
684                                                                                                         if (empty($aSearchTermToken['country_code'])
685                                                                                                                         && empty($aSearchTermToken['lat'])
686                                                                                                                         && empty($aSearchTermToken['class']))
687                                                                                                         {
688                                                                                                                 $aSearch = $aCurrentSearch;
689                                                                                                                 $aSearch['iSearchRank'] += 1;
690                                                                                                                 $aSearch['aAddress'][$aSearchTermToken['word_id']] = $aSearchTermToken['word_id'];
691                                                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
692                                                                                                         }
693                                                                                                 }
694                                                                                         }
695                                                                                         else
696                                                                                         {
697                                                                                                 $aSearch['aAddressNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
698                                                                                                 if (preg_match('#^[0-9]+$#', $sToken)) $aSearch['iSearchRank'] += 2;
699                                                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
700                                                                                         }
701                                                                                 }
702
703                                                                                 if (!sizeof($aCurrentSearch['aName']) || $aCurrentSearch['iNamePhrase'] == $iPhrase)
704                                                                                 {
705                                                                                         $aSearch = $aCurrentSearch;
706                                                                                         $aSearch['iSearchRank'] += 1;
707                                                                                         if (!sizeof($aCurrentSearch['aName'])) $aSearch['iSearchRank'] += 1;
708                                                                                         if (preg_match('#^[0-9]+$#', $sToken)) $aSearch['iSearchRank'] += 2;
709                                                                                         if ($aWordFrequencyScores[$aSearchTerm['word_id']] < CONST_Max_Word_Frequency)
710                                                                                                 $aSearch['aName'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
711                                                                                         else
712                                                                                                 $aSearch['aNameNonSearch'][$aSearchTerm['word_id']] = $aSearchTerm['word_id'];
713                                                                                         $aSearch['iNamePhrase'] = $iPhrase;
714                                                                                         if ($aSearch['iSearchRank'] < $this->iMaxRank) $aNewWordsetSearches[] = $aSearch;
715                                                                                 }
716                                                                         }
717                                                                 }
718                                                         }
719                                                         else
720                                                         {
721                                                                 // Allow skipping a word - but at EXTREME cost
722                                                                 //$aSearch = $aCurrentSearch;
723                                                                 //$aSearch['iSearchRank']+=100;
724                                                                 //$aNewWordsetSearches[] = $aSearch;
725                                                         }
726                                                 }
727                                                 // Sort and cut
728                                                 usort($aNewWordsetSearches, 'bySearchRank');
729                                                 $aWordsetSearches = array_slice($aNewWordsetSearches, 0, 50);
730                                         }
731                                         //var_Dump('<hr>',sizeof($aWordsetSearches)); exit;
732
733                                         $aNewPhraseSearches = array_merge($aNewPhraseSearches, $aNewWordsetSearches);
734                                         usort($aNewPhraseSearches, 'bySearchRank');
735
736                                         $aSearchHash = array();
737                                         foreach($aNewPhraseSearches as $iSearch => $aSearch)
738                                         {
739                                                 $sHash = serialize($aSearch);
740                                                 if (isset($aSearchHash[$sHash])) unset($aNewPhraseSearches[$iSearch]);
741                                                 else $aSearchHash[$sHash] = 1;
742                                         }
743
744                                         $aNewPhraseSearches = array_slice($aNewPhraseSearches, 0, 50);
745                                 }
746
747                                 // Re-group the searches by their score, junk anything at or above iMaxRank (default 20) as just not worth trying
748                                 $aGroupedSearches = array();
749                                 foreach($aNewPhraseSearches as $aSearch)
750                                 {
751                                         if ($aSearch['iSearchRank'] < $this->iMaxRank)
752                                         {
753                                                 if (!isset($aGroupedSearches[$aSearch['iSearchRank']])) $aGroupedSearches[$aSearch['iSearchRank']] = array();
754                                                 $aGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
755                                         }
756                                 }
757                                 ksort($aGroupedSearches);
758
759                                 $iSearchCount = 0;
760                                 $aSearches = array();
761                                 foreach($aGroupedSearches as $iScore => $aNewSearches)
762                                 {
763                                         $iSearchCount += sizeof($aNewSearches);
764                                         $aSearches = array_merge($aSearches, $aNewSearches);
765                                         if ($iSearchCount > 50) break;
766                                 }
767
768                                 //if (CONST_Debug) _debugDumpGroupedSearches($aGroupedSearches, $aValidTokens);
769
770                         }
771                         return $aGroupedSearches;
772
773                 }
774
775                 /* Perform the actual query lookup.
776
777                         Returns an ordered list of results, each with the following fields:
778                                 osm_type: type of corresponding OSM object
779                                                         N - node
780                                                         W - way
781                                                         R - relation
782                                                         P - postcode (internally computed)
783                                 osm_id: id of corresponding OSM object
784                                 class: general object class (corresponds to tag key of primary OSM tag)
785                                 type: subclass of object (corresponds to tag value of primary OSM tag)
786                                 admin_level: see http://wiki.openstreetmap.org/wiki/Admin_level
787                                 rank_search: rank in search hierarchy
788                                                         (see also http://wiki.openstreetmap.org/wiki/Nominatim/Development_overview#Country_to_street_level)
789                                 rank_address: rank in address hierarchy (determines order in address)
790                                 place_id: internal key (may differ between different instances)
791                                 country_code: ISO country code
792                                 langaddress: localized full address
793                                 placename: localized name of object
794                                 ref: content of ref tag (if available)
795                                 lon: longitude
796                                 lat: latitude
797                                 importance: importance of place based on Wikipedia link count
798                                 addressimportance: cumulated importance of address elements
799                                 extra_place: type of place (for admin boundaries, if there is a place tag)
800                                 aBoundingBox: bounding Box
801                                 label: short description of the object class/type (English only)
802                                 name: full name (currently the same as langaddress)
803                                 foundorder: secondary ordering for places with same importance
804                 */
805                 function lookup()
806                 {
807                         if (!$this->sQuery && !$this->aStructuredQuery) return false;
808
809                         $sLanguagePrefArraySQL = "ARRAY[".join(',',array_map("getDBQuoted",$this->aLangPrefOrder))."]";
810                         $sCountryCodesSQL = false;
811                         if ($this->aCountryCodes && sizeof($this->aCountryCodes))
812                         {
813                                 $sCountryCodesSQL = join(',', array_map('addQuotes', $this->aCountryCodes));
814                         }
815
816                         $sQuery = $this->sQuery;
817
818                         // Conflicts between US state abbreviations and various words for 'the' in different languages
819                         if (isset($this->aLangPrefOrder['name:en']))
820                         {
821                                 $sQuery = preg_replace('/(^|,)\s*il\s*(,|$)/','\1illinois\2', $sQuery);
822                                 $sQuery = preg_replace('/(^|,)\s*al\s*(,|$)/','\1alabama\2', $sQuery);
823                                 $sQuery = preg_replace('/(^|,)\s*la\s*(,|$)/','\1louisiana\2', $sQuery);
824                         }
825
826                         // View Box SQL
827                         $sViewboxCentreSQL = false;
828                         $bBoundingBoxSearch = false;
829                         if ($this->aViewBox)
830                         {
831                                 $fHeight = $this->aViewBox[0]-$this->aViewBox[2];
832                                 $fWidth = $this->aViewBox[1]-$this->aViewBox[3];
833                                 $aBigViewBox[0] = $this->aViewBox[0] + $fHeight;
834                                 $aBigViewBox[2] = $this->aViewBox[2] - $fHeight;
835                                 $aBigViewBox[1] = $this->aViewBox[1] + $fWidth;
836                                 $aBigViewBox[3] = $this->aViewBox[3] - $fWidth;
837
838                                 $this->sViewboxSmallSQL = "ST_SetSRID(ST_MakeBox2D(ST_Point(".(float)$this->aViewBox[0].",".(float)$this->aViewBox[1]."),ST_Point(".(float)$this->aViewBox[2].",".(float)$this->aViewBox[3].")),4326)";
839                                 $this->sViewboxLargeSQL = "ST_SetSRID(ST_MakeBox2D(ST_Point(".(float)$aBigViewBox[0].",".(float)$aBigViewBox[1]."),ST_Point(".(float)$aBigViewBox[2].",".(float)$aBigViewBox[3].")),4326)";
840                                 $bBoundingBoxSearch = $this->bBoundedSearch;
841                         }
842
843                         // Route SQL
844                         if ($this->aRoutePoints)
845                         {
846                                 $sViewboxCentreSQL = "ST_SetSRID('LINESTRING(";
847                                 $bFirst = true;
848                                 foreach($this->aRoutePoints as $aPoint)
849                                 {
850                                         if (!$bFirst) $sViewboxCentreSQL .= ",";
851                                         $sViewboxCentreSQL .= $aPoint[0].' '.$aPoint[1];
852                                         $bFirst = false;
853                                 }
854                                 $sViewboxCentreSQL .= ")'::geometry,4326)";
855
856                                 $sSQL = "select st_buffer(".$sViewboxCentreSQL.",".(float)($_GET['routewidth']/69).")";
857                                 $this->sViewboxSmallSQL = $this->oDB->getOne($sSQL);
858                                 if (PEAR::isError($this->sViewboxSmallSQL))
859                                 {
860                                         failInternalError("Could not get small viewbox.", $sSQL, $this->sViewboxSmallSQL);
861                                 }
862                                 $this->sViewboxSmallSQL = "'".$this->sViewboxSmallSQL."'::geometry";
863
864                                 $sSQL = "select st_buffer(".$sViewboxCentreSQL.",".(float)($_GET['routewidth']/30).")";
865                                 $this->sViewboxLargeSQL = $this->oDB->getOne($sSQL);
866                                 if (PEAR::isError($this->sViewboxLargeSQL))
867                                 {
868                                         failInternalError("Could not get large viewbox.", $sSQL, $this->sViewboxLargeSQL);
869                                 }
870                                 $this->sViewboxLargeSQL = "'".$this->sViewboxLargeSQL."'::geometry";
871                                 $bBoundingBoxSearch = $this->bBoundedSearch;
872                         }
873
874                         // Do we have anything that looks like a lat/lon pair?
875                         if ( $aLooksLike = looksLikeLatLonPair($sQuery) )
876             {
877                                 $this->setNearPoint(array($aLooksLike['lat'], $aLooksLike['lon']));
878                                 $sQuery = $aLooksLike['query'];
879                         }
880
881                         $aSearchResults = array();
882                         if ($sQuery || $this->aStructuredQuery)
883                         {
884                                 // Start with a blank search
885                                 $aSearches = array(
886                                         array('iSearchRank' => 0,
887                                                                 'iNamePhrase' => -1,
888                                                                 'sCountryCode' => false,
889                                                                 'aName' => array(),
890                                                                 'aAddress' => array(),
891                                                                 'aFullNameAddress' => array(),
892                                                                 'aNameNonSearch' => array(),
893                                                                 'aAddressNonSearch' => array(),
894                                                                 'sOperator' => '',
895                                                                 'aFeatureName' => array(),
896                                                                 'sClass' => '',
897                                                                 'sType' => '',
898                                                                 'sHouseNumber' => '',
899                                                                 'fLat' => '',
900                                                                 'fLon' => '',
901                                                                 'fRadius' => ''
902                                                         )
903                                 );
904
905                                 // Do we have a radius search?
906                                 $sNearPointSQL = false;
907                                 if ($this->aNearPoint)
908                                 {
909                                         $sNearPointSQL = "ST_SetSRID(ST_Point(".(float)$this->aNearPoint[1].",".(float)$this->aNearPoint[0]."),4326)";
910                                         $aSearches[0]['fLat'] = (float)$this->aNearPoint[0];
911                                         $aSearches[0]['fLon'] = (float)$this->aNearPoint[1];
912                                         $aSearches[0]['fRadius'] = (float)$this->aNearPoint[2];
913                                 }
914
915                                 // Any 'special' terms in the search?
916                                 $bSpecialTerms = false;
917                                 preg_match_all('/\\[(.*)=(.*)\\]/', $sQuery, $aSpecialTermsRaw, PREG_SET_ORDER);
918                                 $aSpecialTerms = array();
919                                 foreach($aSpecialTermsRaw as $aSpecialTerm)
920                                 {
921                                         $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery);
922                                         $aSpecialTerms[strtolower($aSpecialTerm[1])] = $aSpecialTerm[2];
923                                 }
924
925                                 preg_match_all('/\\[([\\w ]*)\\]/u', $sQuery, $aSpecialTermsRaw, PREG_SET_ORDER);
926                                 $aSpecialTerms = array();
927                                 if (isset($this->aStructuredQuery['amenity']) && $this->aStructuredQuery['amenity'])
928                                 {
929                                         $aSpecialTermsRaw[] = array('['.$this->aStructuredQuery['amenity'].']', $this->aStructuredQuery['amenity']);
930                                         unset($this->aStructuredQuery['amenity']);
931                                 }
932                                 foreach($aSpecialTermsRaw as $aSpecialTerm)
933                                 {
934                                         $sQuery = str_replace($aSpecialTerm[0], ' ', $sQuery);
935                                         $sToken = $this->oDB->getOne("select make_standard_name('".$aSpecialTerm[1]."') as string");
936                                         $sSQL = 'select * from (select word_id,word_token, word, class, type, country_code, operator';
937                                         $sSQL .= ' from word where word_token in (\' '.$sToken.'\')) as x where (class is not null and class not in (\'place\')) or country_code is not null';
938                                         if (CONST_Debug) var_Dump($sSQL);
939                                         $aSearchWords = $this->oDB->getAll($sSQL);
940                                         $aNewSearches = array();
941                                         foreach($aSearches as $aSearch)
942                                         {
943                                                 foreach($aSearchWords as $aSearchTerm)
944                                                 {
945                                                         $aNewSearch = $aSearch;
946                                                         if ($aSearchTerm['country_code'])
947                                                         {
948                                                                 $aNewSearch['sCountryCode'] = strtolower($aSearchTerm['country_code']);
949                                                                 $aNewSearches[] = $aNewSearch;
950                                                                 $bSpecialTerms = true;
951                                                         }
952                                                         if ($aSearchTerm['class'])
953                                                         {
954                                                                 $aNewSearch['sClass'] = $aSearchTerm['class'];
955                                                                 $aNewSearch['sType'] = $aSearchTerm['type'];
956                                                                 $aNewSearches[] = $aNewSearch;
957                                                                 $bSpecialTerms = true;
958                                                         }
959                                                 }
960                                         }
961                                         $aSearches = $aNewSearches;
962                                 }
963
964                                 // Split query into phrases
965                                 // Commas are used to reduce the search space by indicating where phrases split
966                                 if ($this->aStructuredQuery)
967                                 {
968                                         $aPhrases = $this->aStructuredQuery;
969                                         $bStructuredPhrases = true;
970                                 }
971                                 else
972                                 {
973                                         $aPhrases = explode(',',$sQuery);
974                                         $bStructuredPhrases = false;
975                                 }
976
977                                 // Convert each phrase to standard form
978                                 // Create a list of standard words
979                                 // Get all 'sets' of words
980                                 // Generate a complete list of all tokens
981                                 $aTokens = array();
982                                 foreach($aPhrases as $iPhrase => $sPhrase)
983                                 {
984                                         $aPhrase = $this->oDB->getRow("select make_standard_name('".pg_escape_string($sPhrase)."') as string");
985                                         if (PEAR::isError($aPhrase))
986                                         {
987                                                 userError("Illegal query string (not an UTF-8 string): ".$sPhrase);
988                                                 if (CONST_Debug) var_dump($aPhrase);
989                                                 exit;
990                                         }
991                                         if (trim($aPhrase['string']))
992                                         {
993                                                 $aPhrases[$iPhrase] = $aPhrase;
994                                                 $aPhrases[$iPhrase]['words'] = explode(' ',$aPhrases[$iPhrase]['string']);
995                                                 $aPhrases[$iPhrase]['wordsets'] = getWordSets($aPhrases[$iPhrase]['words'], 0);
996                                                 $aTokens = array_merge($aTokens, getTokensFromSets($aPhrases[$iPhrase]['wordsets']));
997                                         }
998                                         else
999                                         {
1000                                                 unset($aPhrases[$iPhrase]);
1001                                         }
1002                                 }
1003
1004                                 // Reindex phrases - we make assumptions later on that they are numerically keyed in order
1005                                 $aPhraseTypes = array_keys($aPhrases);
1006                                 $aPhrases = array_values($aPhrases);
1007
1008                                 if (sizeof($aTokens))
1009                                 {
1010                                         // Check which tokens we have, get the ID numbers
1011                                         $sSQL = 'select word_id,word_token, word, class, type, country_code, operator, search_name_count';
1012                                         $sSQL .= ' from word where word_token in ('.join(',',array_map("getDBQuoted",$aTokens)).')';
1013
1014                                         if (CONST_Debug) var_Dump($sSQL);
1015
1016                                         $aValidTokens = array();
1017                                         if (sizeof($aTokens)) $aDatabaseWords = $this->oDB->getAll($sSQL);
1018                                         else $aDatabaseWords = array();
1019                                         if (PEAR::IsError($aDatabaseWords))
1020                                         {
1021                                                 failInternalError("Could not get word tokens.", $sSQL, $aDatabaseWords);
1022                                         }
1023                                         $aPossibleMainWordIDs = array();
1024                                         $aWordFrequencyScores = array();
1025                                         foreach($aDatabaseWords as $aToken)
1026                                         {
1027                                                 // Very special case - require 2 letter country param to match the country code found
1028                                                 if ($bStructuredPhrases && $aToken['country_code'] && !empty($this->aStructuredQuery['country'])
1029                                                                 && strlen($this->aStructuredQuery['country']) == 2 && strtolower($this->aStructuredQuery['country']) != $aToken['country_code'])
1030                                                 {
1031                                                         continue;
1032                                                 }
1033
1034                                                 if (isset($aValidTokens[$aToken['word_token']]))
1035                                                 {
1036                                                         $aValidTokens[$aToken['word_token']][] = $aToken;
1037                                                 }
1038                                                 else
1039                                                 {
1040                                                         $aValidTokens[$aToken['word_token']] = array($aToken);
1041                                                 }
1042                                                 if (!$aToken['class'] && !$aToken['country_code']) $aPossibleMainWordIDs[$aToken['word_id']] = 1;
1043                                                 $aWordFrequencyScores[$aToken['word_id']] = $aToken['search_name_count'] + 1;
1044                                         }
1045                                         if (CONST_Debug) var_Dump($aPhrases, $aValidTokens);
1046
1047                                         // Try and calculate GB postcodes we might be missing
1048                                         foreach($aTokens as $sToken)
1049                                         {
1050                                                 // Source of gb postcodes is now definitive - always use
1051                                                 if (preg_match('/^([A-Z][A-Z]?[0-9][0-9A-Z]? ?[0-9])([A-Z][A-Z])$/', strtoupper(trim($sToken)), $aData))
1052                                                 {
1053                                                         if (substr($aData[1],-2,1) != ' ')
1054                                                         {
1055                                                                 $aData[0] = substr($aData[0],0,strlen($aData[1])-1).' '.substr($aData[0],strlen($aData[1])-1);
1056                                                                 $aData[1] = substr($aData[1],0,-1).' '.substr($aData[1],-1,1);
1057                                                         }
1058                                                         $aGBPostcodeLocation = gbPostcodeCalculate($aData[0], $aData[1], $aData[2], $this->oDB);
1059                                                         if ($aGBPostcodeLocation)
1060                                                         {
1061                                                                 $aValidTokens[$sToken] = $aGBPostcodeLocation;
1062                                                         }
1063                                                 }
1064                                                 // US ZIP+4 codes - if there is no token,
1065                                                 //      merge in the 5-digit ZIP code
1066                                                 else if (!isset($aValidTokens[$sToken]) && preg_match('/^([0-9]{5}) [0-9]{4}$/', $sToken, $aData))
1067                                                 {
1068                                                         if (isset($aValidTokens[$aData[1]]))
1069                                                         {
1070                                                                 foreach($aValidTokens[$aData[1]] as $aToken)
1071                                                                 {
1072                                                                         if (!$aToken['class'])
1073                                                                         {
1074                                                                                 if (isset($aValidTokens[$sToken]))
1075                                                                                 {
1076                                                                                         $aValidTokens[$sToken][] = $aToken;
1077                                                                                 }
1078                                                                                 else
1079                                                                                 {
1080                                                                                         $aValidTokens[$sToken] = array($aToken);
1081                                                                                 }
1082                                                                         }
1083                                                                 }
1084                                                         }
1085                                                 }
1086                                         }
1087
1088                                         foreach($aTokens as $sToken)
1089                                         {
1090                                                 // Unknown single word token with a number - assume it is a house number
1091                                                 if (!isset($aValidTokens[' '.$sToken]) && strpos($sToken,' ') === false && preg_match('/[0-9]/', $sToken))
1092                                                 {
1093                                                         $aValidTokens[' '.$sToken] = array(array('class'=>'place','type'=>'house'));
1094                                                 }
1095                                         }
1096
1097                                         // Any words that have failed completely?
1098                                         // TODO: suggestions
1099
1100                                         // Start the search process
1101                                         // array with: placeid => -1 | tiger-housenumber
1102                                         $aResultPlaceIDs = array();
1103
1104                                         $aGroupedSearches = $this->getGroupedSearches($aSearches, $aPhraseTypes, $aPhrases, $aValidTokens, $aWordFrequencyScores, $bStructuredPhrases);
1105
1106                                         if ($this->bReverseInPlan)
1107                                         {
1108                                                 // Reverse phrase array and also reverse the order of the wordsets in
1109                                                 // the first and final phrase. Don't bother about phrases in the middle
1110                                                 // because order in the address doesn't matter.
1111                                                 $aPhrases = array_reverse($aPhrases);
1112                                                 $aPhrases[0]['wordsets'] = getInverseWordSets($aPhrases[0]['words'], 0);
1113                                                 if (sizeof($aPhrases) > 1)
1114                                                 {
1115                                                         $aFinalPhrase = end($aPhrases);
1116                                                         $aPhrases[sizeof($aPhrases)-1]['wordsets'] = getInverseWordSets($aFinalPhrase['words'], 0);
1117                                                 }
1118                                                 $aReverseGroupedSearches = $this->getGroupedSearches($aSearches, null, $aPhrases, $aValidTokens, $aWordFrequencyScores, false);
1119
1120                                                 foreach($aGroupedSearches as $aSearches)
1121                                                 {
1122                                                         foreach($aSearches as $aSearch)
1123                                                         {
1124                                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank)
1125                                                                 {
1126                                                                         if (!isset($aReverseGroupedSearches[$aSearch['iSearchRank']])) $aReverseGroupedSearches[$aSearch['iSearchRank']] = array();
1127                                                                         $aReverseGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
1128                                                                 }
1129
1130                                                         }
1131                                                 }
1132
1133                                                 $aGroupedSearches = $aReverseGroupedSearches;
1134                                                 ksort($aGroupedSearches);
1135                                         }
1136                                 }
1137                                 else
1138                                 {
1139                                         // Re-group the searches by their score; discard anything ranked at or above iMaxRank (default 20) as not worth trying
1140                                         $aGroupedSearches = array();
1141                                         foreach($aSearches as $aSearch)
1142                                         {
1143                                                 if ($aSearch['iSearchRank'] < $this->iMaxRank)
1144                                                 {
1145                                                         if (!isset($aGroupedSearches[$aSearch['iSearchRank']])) $aGroupedSearches[$aSearch['iSearchRank']] = array();
1146                                                         $aGroupedSearches[$aSearch['iSearchRank']][] = $aSearch;
1147                                                 }
1148                                         }
1149                                         ksort($aGroupedSearches);
1150                                 }
1151
1152                                 if (CONST_Debug) var_Dump($aGroupedSearches);
1153
1154                                 if (CONST_Search_TryDroppedAddressTerms && sizeof($this->aStructuredQuery) > 0)
1155                                 {
1156                                         $aCopyGroupedSearches = $aGroupedSearches;
1157                                         foreach($aCopyGroupedSearches as $iGroup => $aSearches)
1158                                         {
1159                                                 foreach($aSearches as $iSearch => $aSearch)
1160                                                 {
1161                                                         $aReductionsList = array($aSearch['aAddress']);
1162                                                         $iSearchRank = $aSearch['iSearchRank'];
1163                                                         while(sizeof($aReductionsList) > 0)
1164                                                         {
1165                                                                 $iSearchRank += 5;
1166                                                                 if ($iSearchRank > iMaxRank) break 3;
1167                                                                 $aNewReductionsList = array();
1168                                                                 foreach($aReductionsList as $aReductionsWordList)
1169                                                                 {
1170                                                                         for ($iReductionWord = 0; $iReductionWord < sizeof($aReductionsWordList); $iReductionWord++)
1171                                                                         {
1172                                                                                 $aReductionsWordListResult = array_merge(array_slice($aReductionsWordList, 0, $iReductionWord), array_slice($aReductionsWordList, $iReductionWord+1));
1173                                                                                 $aReverseSearch = $aSearch;
1174                                                                                 $aSearch['aAddress'] = $aReductionsWordListResult;
1175                                                                                 $aSearch['iSearchRank'] = $iSearchRank;
1176                                                                                 $aGroupedSearches[$iSearchRank][] = $aReverseSearch;
1177                                                                                 if (sizeof($aReductionsWordListResult) > 0)
1178                                                                                 {
1179                                                                                         $aNewReductionsList[] = $aReductionsWordListResult;
1180                                                                                 }
1181                                                                         }
1182                                                                 }
1183                                                                 $aReductionsList = $aNewReductionsList;
1184                                                         }
1185                                                 }
1186                                         }
1187                                         ksort($aGroupedSearches);
1188                                 }
1189
1190                                 // Filter out duplicate searches
1191                                 $aSearchHash = array();
1192                                 foreach($aGroupedSearches as $iGroup => $aSearches)
1193                                 {
1194                                         foreach($aSearches as $iSearch => $aSearch)
1195                                         {
1196                                                 $sHash = serialize($aSearch);
1197                                                 if (isset($aSearchHash[$sHash]))
1198                                                 {
1199                                                         unset($aGroupedSearches[$iGroup][$iSearch]);
1200                                                         if (sizeof($aGroupedSearches[$iGroup]) == 0) unset($aGroupedSearches[$iGroup]);
1201                                                 }
1202                                                 else
1203                                                 {
1204                                                         $aSearchHash[$sHash] = 1;
1205                                                 }
1206                                         }
1207                                 }
1208
1209                                 if (CONST_Debug) _debugDumpGroupedSearches($aGroupedSearches, $aValidTokens);
1210
1211                                 $iGroupLoop = 0;
1212                                 $iQueryLoop = 0;
1213                                 foreach($aGroupedSearches as $iGroupedRank => $aSearches)
1214                                 {
1215                                         $iGroupLoop++;
1216                                         foreach($aSearches as $aSearch)
1217                                         {
1218                                                 $iQueryLoop++;
1219                                                 $searchedHousenumber = -1;
1220
1221                                                 if (CONST_Debug) { echo "<hr><b>Search Loop, group $iGroupLoop, loop $iQueryLoop</b>"; }
1222                                                 if (CONST_Debug) _debugDumpGroupedSearches(array($iGroupedRank => array($aSearch)), $aValidTokens);
1223
1224                                                 // No location term?
1225                                                 if (!sizeof($aSearch['aName']) && !sizeof($aSearch['aAddress']) && !$aSearch['fLon'])
1226                                                 {
1227                                                         if ($aSearch['sCountryCode'] && !$aSearch['sClass'] && !$aSearch['sHouseNumber'])
1228                                                         {
1229                                                                 // Just looking for a country by code - look it up
1230                                                                 if (4 >= $this->iMinAddressRank && 4 <= $this->iMaxAddressRank)
1231                                                                 {
1232                                                                         $sSQL = "select place_id from placex where calculated_country_code='".$aSearch['sCountryCode']."' and rank_search = 4";
1233                                                                         if ($sCountryCodesSQL) $sSQL .= " and calculated_country_code in ($sCountryCodesSQL)";
1234                                                                         if ($bBoundingBoxSearch)
1235                                                                                 $sSQL .= " and _st_intersects($this->sViewboxSmallSQL, geometry)";
1236                                                                         $sSQL .= " order by st_area(geometry) desc limit 1";
1237                                                                         if (CONST_Debug) var_dump($sSQL);
1238                                                                         $aPlaceIDs = $this->oDB->getCol($sSQL);
1239                                                                 }
1240                                                                 else
1241                                                                 {
1242                                                                         $aPlaceIDs = array();
1243                                                                 }
1244                                                         }
1245                                                         else
1246                                                         {
1247                                                                 if (!$bBoundingBoxSearch && !$aSearch['fLon']) continue;
1248                                                                 if (!$aSearch['sClass']) continue;
1249                                                                 $sSQL = "select count(*) from pg_tables where tablename = 'place_classtype_".$aSearch['sClass']."_".$aSearch['sType']."'";
1250                                                                 if ($this->oDB->getOne($sSQL))
1251                                                                 {
1252                                                                         $sSQL = "select place_id from place_classtype_".$aSearch['sClass']."_".$aSearch['sType']." ct";
1253                                                                         if ($sCountryCodesSQL) $sSQL .= " join placex using (place_id)";
1254                                                                         $sSQL .= " where st_contains($this->sViewboxSmallSQL, ct.centroid)";
1255                                                                         if ($sCountryCodesSQL) $sSQL .= " and calculated_country_code in ($sCountryCodesSQL)";
1256                                                                         if (sizeof($this->aExcludePlaceIDs))
1257                                                                         {
1258                                                                                 $sSQL .= " and place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1259                                                                         }
1260                                                                         if ($sViewboxCentreSQL) $sSQL .= " order by st_distance($sViewboxCentreSQL, ct.centroid) asc";
1261                                                                         $sSQL .= " limit $this->iLimit";
1262                                                                         if (CONST_Debug) var_dump($sSQL);
1263                                                                         $aPlaceIDs = $this->oDB->getCol($sSQL);
1264
1265                                                                         // If excluded place IDs are given, it is fair to assume that
1266                                                                         // there have been results in the small box, so no further
1267                                                                         // expansion in that case.
1268                                                                         // Also don't expand if bounded results were requested.
1269                                                                         if (!sizeof($aPlaceIDs) && !sizeof($this->aExcludePlaceIDs) && !$this->bBoundedSearch)
1270                                                                         {
1271                                                                                 $sSQL = "select place_id from place_classtype_".$aSearch['sClass']."_".$aSearch['sType']." ct";
1272                                                                                 if ($sCountryCodesSQL) $sSQL .= " join placex using (place_id)";
1273                                                                                 $sSQL .= " where st_contains($this->sViewboxLargeSQL, ct.centroid)";
1274                                                                                 if ($sCountryCodesSQL) $sSQL .= " and calculated_country_code in ($sCountryCodesSQL)";
1275                                                                                 if ($sViewboxCentreSQL) $sSQL .= " order by st_distance($sViewboxCentreSQL, ct.centroid) asc";
1276                                                                                 $sSQL .= " limit $this->iLimit";
1277                                                                                 if (CONST_Debug) var_dump($sSQL);
1278                                                                                 $aPlaceIDs = $this->oDB->getCol($sSQL);
1279                                                                         }
1280                                                                 }
1281                                                                 else
1282                                                                 {
1283                                                                         $sSQL = "select place_id from placex where class='".$aSearch['sClass']."' and type='".$aSearch['sType']."'";
1284                                                                         $sSQL .= " and st_contains($this->sViewboxSmallSQL, geometry) and linked_place_id is null";
1285                                                                         if ($sCountryCodesSQL) $sSQL .= " and calculated_country_code in ($sCountryCodesSQL)";
1286                                                                         if ($sViewboxCentreSQL) $sSQL .= " order by st_distance($sViewboxCentreSQL, centroid) asc";
1287                                                                         $sSQL .= " limit $this->iLimit";
1288                                                                         if (CONST_Debug) var_dump($sSQL);
1289                                                                         $aPlaceIDs = $this->oDB->getCol($sSQL);
1290                                                                 }
1291                                                         }
1292                                                 }
1293                                                 else
1294                                                 {
1295                                                         $aPlaceIDs = array();
1296
1297                                                         // First we need a position, either aName or fLat or both
1298                                                         $aTerms = array();
1299                                                         $aOrder = array();
1300
1301                                                         if ($aSearch['sHouseNumber'] && sizeof($aSearch['aAddress']))
1302                                                         {
1303                                                                 $sHouseNumberRegex = '\\\\m'.$aSearch['sHouseNumber'].'\\\\M';
1304                                                                 $aOrder[] = "exists(select place_id from placex where parent_place_id = search_name.place_id and transliteration(housenumber) ~* E'".$sHouseNumberRegex."' limit 1) desc";
1305                                                         }
1306
1307                                                         // TODO: filter out the pointless search terms (2 letter name tokens and less)
1308                                                         // they might be right - but they are just too darned expensive to run
1309                                                         if (sizeof($aSearch['aName'])) $aTerms[] = "name_vector @> ARRAY[".join($aSearch['aName'],",")."]";
1310                                                         if (sizeof($aSearch['aNameNonSearch'])) $aTerms[] = "array_cat(name_vector,ARRAY[]::integer[]) @> ARRAY[".join($aSearch['aNameNonSearch'],",")."]";
1311                                                         if (sizeof($aSearch['aAddress']) && $aSearch['aName'] != $aSearch['aAddress'])
1312                                                         {
1313                                                                 // For infrequent name terms disable index usage for address
1314                                                                 if (CONST_Search_NameOnlySearchFrequencyThreshold &&
1315                                                                                 sizeof($aSearch['aName']) == 1 &&
1316                                                                                 $aWordFrequencyScores[$aSearch['aName'][reset($aSearch['aName'])]] < CONST_Search_NameOnlySearchFrequencyThreshold)
1317                                                                 {
1318                                                                         $aTerms[] = "array_cat(nameaddress_vector,ARRAY[]::integer[]) @> ARRAY[".join(array_merge($aSearch['aAddress'],$aSearch['aAddressNonSearch']),",")."]";
1319                                                                 }
1320                                                                 else
1321                                                                 {
1322                                                                         $aTerms[] = "nameaddress_vector @> ARRAY[".join($aSearch['aAddress'],",")."]";
1323                                                                         if (sizeof($aSearch['aAddressNonSearch'])) $aTerms[] = "array_cat(nameaddress_vector,ARRAY[]::integer[]) @> ARRAY[".join($aSearch['aAddressNonSearch'],",")."]";
1324                                                                 }
1325                                                         }
1326                                                         if ($aSearch['sCountryCode']) $aTerms[] = "country_code = '".pg_escape_string($aSearch['sCountryCode'])."'";
1327                                                         if ($aSearch['sHouseNumber'])
1328                                                         {
1329                                                                 $aTerms[] = "address_rank between 16 and 27";
1330                                                         }
1331                                                         else
1332                                                         {
1333                                                                 if ($this->iMinAddressRank > 0)
1334                                                                 {
1335                                                                         $aTerms[] = "address_rank >= ".$this->iMinAddressRank;
1336                                                                 }
1337                                                                 if ($this->iMaxAddressRank < 30)
1338                                                                 {
1339                                                                         $aTerms[] = "address_rank <= ".$this->iMaxAddressRank;
1340                                                                 }
1341                                                         }
1342                                                         if ($aSearch['fLon'] && $aSearch['fLat'])
1343                                                         {
1344                                                                 $aTerms[] = "ST_DWithin(centroid, ST_SetSRID(ST_Point(".$aSearch['fLon'].",".$aSearch['fLat']."),4326), ".$aSearch['fRadius'].")";
1345                                                                 $aOrder[] = "ST_Distance(centroid, ST_SetSRID(ST_Point(".$aSearch['fLon'].",".$aSearch['fLat']."),4326)) ASC";
1346                                                         }
1347                                                         if (sizeof($this->aExcludePlaceIDs))
1348                                                         {
1349                                                                 $aTerms[] = "place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1350                                                         }
1351                                                         if ($sCountryCodesSQL)
1352                                                         {
1353                                                                 $aTerms[] = "country_code in ($sCountryCodesSQL)";
1354                                                         }
1355
1356                                                         if ($bBoundingBoxSearch) $aTerms[] = "centroid && $this->sViewboxSmallSQL";
1357                                                         if ($sNearPointSQL) $aOrder[] = "ST_Distance($sNearPointSQL, centroid) asc";
1358
1359                                                         if ($aSearch['sHouseNumber'])
1360                                                         {
1361                                                                 $sImportanceSQL = '- abs(26 - address_rank) + 3';
1362                                                         }
1363                                                         else
1364                                                         {
1365                                                                 $sImportanceSQL = '(case when importance = 0 OR importance IS NULL then 0.75-(search_rank::float/40) else importance end)';
1366                                                         }
1367                                                         if ($this->sViewboxSmallSQL) $sImportanceSQL .= " * case when ST_Contains($this->sViewboxSmallSQL, centroid) THEN 1 ELSE 0.5 END";
1368                                                         if ($this->sViewboxLargeSQL) $sImportanceSQL .= " * case when ST_Contains($this->sViewboxLargeSQL, centroid) THEN 1 ELSE 0.5 END";
1369
1370                                                         $aOrder[] = "$sImportanceSQL DESC";
1371                                                         if (sizeof($aSearch['aFullNameAddress']))
1372                                                         {
1373                                                                 $sExactMatchSQL = '(select count(*) from (select unnest(ARRAY['.join($aSearch['aFullNameAddress'],",").']) INTERSECT select unnest(nameaddress_vector))s) as exactmatch';
1374                                                                 $aOrder[] = 'exactmatch DESC';
1375                                                         } else {
1376                                                                 $sExactMatchSQL = '0::int as exactmatch';
1377                                                         }
1378
1379                                                         if (sizeof($aTerms))
1380                                                         {
1381                                                                 $sSQL = "select place_id, ";
                                                                     // Assemble the search_name lookup: place_id plus the exactmatch
                                                                     // column, filtered by all collected terms and sorted by all
                                                                     // collected order clauses.
1382                                                                 $sSQL .= $sExactMatchSQL;
1383                                                                 $sSQL .= " from search_name";
1384                                                                 $sSQL .= " where ".join(' and ',$aTerms);
1385                                                                 $sSQL .= " order by ".join(', ',$aOrder);
                                                                     // Choose the row limit: a fixed 20 for house number or class
                                                                     // searches, otherwise the configured $this->iLimit.
                                                                     // NOTE(review): the elseif branch below is unreachable - its
                                                                     // condition requires $aSearch['sClass'] to be truthy, and that
                                                                     // already satisfies the first condition. Confirm whether the
                                                                     // "limit 1" test was meant to come first.
1386                                                                 if ($aSearch['sHouseNumber'] || $aSearch['sClass'])
1387                                                                         $sSQL .= " limit 20";
1388                                                                 elseif (!sizeof($aSearch['aName']) && !sizeof($aSearch['aAddress']) && $aSearch['sClass'])
1389                                                                         $sSQL .= " limit 1";
1390                                                                 else
1391                                                                         $sSQL .= " limit ".$this->iLimit;
1392
1393                                                                 if (CONST_Debug) { var_dump($sSQL); }
1394                                                                 $aViewBoxPlaceIDs = $this->oDB->getAll($sSQL);
1395                                                                 if (PEAR::IsError($aViewBoxPlaceIDs))
1396                                                                 {
1397                                                                         failInternalError("Could not get places for search terms.", $sSQL, $aViewBoxPlaceIDs);
1398                                                                 }
1399                                                                 //var_dump($aViewBoxPlaceIDs);
1400                                                                 // Did we have an viewbox matches?
1401                                                                 $aPlaceIDs = array();
1402                                                                 $bViewBoxMatch = false;
1403                                                                 foreach($aViewBoxPlaceIDs as $aViewBoxRow)
1404                                                                 {
1405                                                                         //if ($bViewBoxMatch == 1 && $aViewBoxRow['in_small'] == 'f') break;
1406                                                                         //if ($bViewBoxMatch == 2 && $aViewBoxRow['in_large'] == 'f') break;
1407                                                                         //if ($aViewBoxRow['in_small'] == 't') $bViewBoxMatch = 1;
1408                                                                         //else if ($aViewBoxRow['in_large'] == 't') $bViewBoxMatch = 2;
1409                                                                         $aPlaceIDs[] = $aViewBoxRow['place_id'];
1410                                                                         $this->exactMatchCache[$aViewBoxRow['place_id']] = $aViewBoxRow['exactmatch'];
1411                                                                 }
1412                                                         }
1413                                                         //var_Dump($aPlaceIDs);
1414                                                         //exit;
1415
1416                                                         //now search for housenumber, if housenumber provided
1417                                                         if ($aSearch['sHouseNumber'] && sizeof($aPlaceIDs))
1418                                                         {
                                                                     // Keep the places matched so far: they are the parents searched
                                                                     // by every lookup below and the result of the final fallback.
1419                                                                 $aRoadPlaceIDs = $aPlaceIDs;
1420                                                                 $sPlaceIDs = join(',',$aPlaceIDs);
1421
1422                                                                 // Step 1: look in placex for children of the matched places whose
                                                                     // transliterated housenumber matches the requested number as a
                                                                     // whole word (\m and \M are PostgreSQL's word-start / word-end
                                                                     // regex escapes, ~* matches case-insensitively).
                                                                     // NOTE(review): sHouseNumber is placed in the pattern without
                                                                     // regex or SQL escaping, while the aux query below uses
                                                                     // pg_escape_string - confirm the value is always sanitised
                                                                     // before it reaches this point.
1423                                                                 $sHouseNumberRegex = '\\\\m'.$aSearch['sHouseNumber'].'\\\\M';
1424                                                                 $sSQL = "select place_id from placex where parent_place_id in (".$sPlaceIDs.") and transliteration(housenumber) ~* E'".$sHouseNumberRegex."'";
1425                                                                 if (sizeof($this->aExcludePlaceIDs))
1426                                                                 {
1427                                                                         $sSQL .= " and place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1428                                                                 }
1429                                                                 $sSQL .= " limit $this->iLimit";
1430                                                                 if (CONST_Debug) var_dump($sSQL);
1431                                                                 $aPlaceIDs = $this->oDB->getCol($sSQL);
1432
1433                                                                 // Step 2: nothing in placex - try the aux fallback table, which is
                                                                     // matched on exact housenumber equality. This query has no limit.
1434                                                                 if (!sizeof($aPlaceIDs))
1435                                                                 {
1436                                                                         $sSQL = "select place_id from location_property_aux where parent_place_id in (".$sPlaceIDs.") and housenumber = '".pg_escape_string($aSearch['sHouseNumber'])."'";
1437                                                                         if (sizeof($this->aExcludePlaceIDs))
1438                                                                         {
1439                                                                                 $sSQL .= " and place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1440                                                                         }
1441                                                                         //$sSQL .= " limit $this->iLimit";
1442                                                                         if (CONST_Debug) var_dump($sSQL);
1443                                                                         $aPlaceIDs = $this->oDB->getCol($sSQL);
1444                                                                 }
1445                                                                 // Step 3: nothing in placex or location_property_aux - search the
                                                                     // Tiger data (location_property_tiger) for this house number.
                                                                     // The integer value is computed even when step 3 is skipped and
                                                                     // stays in $searchedHousenumber after this block.
1446                                                                 $searchedHousenumber = intval($aSearch['sHouseNumber']);
1447                                                                 if (!sizeof($aPlaceIDs))
1448                                                                 {
1449                                                                         // Tiger rows describe number ranges (startnumber..endnumber),
                                                                             // not single house numbers.
1450                                                                         if($searchedHousenumber%2 == 0){
1451                                                                                 // Even number: accept ranges with interpolationtype 'even' or 'all'
1452                                                                                 $sSQL = "select distinct place_id from location_property_tiger where parent_place_id in (".$sPlaceIDs.") and (interpolationtype='even' or interpolationtype='all') and ".$searchedHousenumber.">=startnumber and ".$searchedHousenumber."<=endnumber";
1453                                                                         }else{
1454                                                                                 // Odd number: accept ranges with interpolationtype 'odd' or 'all'
1455                                                                                 $sSQL = "select distinct place_id from location_property_tiger where parent_place_id in (".$sPlaceIDs.") and (interpolationtype='odd' or interpolationtype='all') and ".$searchedHousenumber.">=startnumber and ".$searchedHousenumber."<=endnumber";
1456                                                                         }
1457
1458                                                                         if (sizeof($this->aExcludePlaceIDs))
1459                                                                         {
1460                                                                                 $sSQL .= " and place_id not in (".join(',', $this->aExcludePlaceIDs).")";
1461                                                                         }
1462                                                                         //$sSQL .= " limit $this->iLimit";
1463                                                                         if (CONST_Debug) var_dump($sSQL);
1464                                                                         // Fetch the place IDs (the second argument presumably selects
                                                                             // result column 0 - confirm against the DB wrapper).
1465                                                                         $aPlaceIDs = $this->oDB->getCol($sSQL, 0);
1466                                                                 }
1467
1468                                                                 // Step 4: still nothing - fall back to the parent places themselves,
                                                                     // but only if the requested house number contains at least one digit.
1469                                                                 if (!sizeof($aPlaceIDs) && preg_match('/[0-9]+/', $aSearch['sHouseNumber']))
1470                                                                 {
1471                                                                         $aPlaceIDs = $aRoadPlaceIDs;
1472                                                                         // -1 marks that no house number was found
1473                                                                         $searchedHousenumber = -1;
1474                                                                 }
1475                                 // Otherwise $searchedHousenumber keeps the integer value assigned above.
1476                                                         }
1477
1478
1479                                                         if ($aSearch['sClass'] && sizeof($aPlaceIDs))
1480                                                         {
1481                                                                 $sPlaceIDs = join(',', $aPlaceIDs);
1482                                                                 $aClassPlaceIDs = array();
1483
1484                                                                 if (!$aSearch['sOperator'] || $aSearch['sOperator'] == 'name')
1485                                                                 {
1486                                                                         // If they were searching for a named class (i.e. 'Kings Head pub') then we might have an extra match
1487                                                                         $sSQL = "select place_id from placex where place_id in ($sPlaceIDs) and class='".$aSearch['sClass']."' and type='".$aSearch['sType']."'";
1488                                                                         $sSQL .= " and linked_place_id is null";
1489                                                                         if ($sCountryCodesSQL) $sSQL .= " and calculated_country_code in ($sCountryCodesSQL)";
1490                                                                         $sSQL .= " order by rank_search asc limit $this->iLimit";
1491                                                                         if (CONST_Debug) var_dump($sSQL);
1492                                                                         $aClassPlaceIDs = $this->oDB->getCol($sSQL);
1493                                                                 }
1494
1495                                                                 if (!$aSearch['sOperator'] || $aSearch['sOperator'] == 'near') // & in
1496                                                                 {
1497                                                                         $sSQL = "select count(*) from pg_tables where tablename = 'place_classtype_".$aSearch['sClass']."_".$aSearch['sType']."'";
1498                                                                         $bCacheTable = $this->oDB->getOne($sSQL);
1499
1500                                                                         $sSQL = "select min(rank_search) from placex where place_id in ($sPlaceIDs)";
1501
1502                                                                         if (CONST_Debug) var_dump($sSQL);
1503                                                                         $this->iMaxRank = ((int)$this->oDB->getOne($sSQL));
1504
1505                                                                         // For state / country level searches the normal radius search doesn't work very well
1506                                                                         $sPlaceGeom = false;
1507                                                                         if ($this->iMaxRank < 9 && $bCacheTable)
1508                                                                         {
1509                                                                                 // Try and get a polygon to search in instead
1510                                                                                 $sSQL = "select geometry from placex where place_id in ($sPlaceIDs) and rank_search < $this->iMaxRank + 5 and st_geometrytype(geometry) in ('ST_Polygon','ST_MultiPolygon') order by rank_search asc limit 1";
1511                                                                                 if (CONST_Debug) var_dump($sSQL);
1512                                                                                 $sPlaceGeom = $this->oDB->getOne($sSQL);
1513                                                                         }
1514
1515                                                                         if ($sPlaceGeom)
1516                                                                         {
1517                                                                                 $sPlaceIDs = false;
1518                                                                         }
1519                                                                         else
1520                                                                         {
1521                                                                                 $this->iMaxRank += 5;
1522                                                                                 $sSQL = "select place_id from placex where place_id in ($sPlaceIDs) and rank_search < $this->iMaxRank";
1523                                                                                 if (CONST_Debug) var_dump($sSQL);
1524                                                                                 $aPlaceIDs = $this->oDB->getCol($sSQL);
1525                                                                                 $sPlaceIDs = join(',',$aPlaceIDs);
1526                                                                         }
1527
1528                                                                         if ($sPlaceIDs || $sPlaceGeom)
1529                                                                         {
                                                                             // Collect objects of the requested class/type that lie around the
                                                                             // places found so far ($sPlaceIDs) or inside the area polygon
                                                                             // ($sPlaceGeom), and append them to $aClassPlaceIDs.
1530
1531                                                                                 $fRange = 0.01;
1532                                                                                 if ($bCacheTable)
1533                                                                                 {
1534                                                                                         // More efficient - can make the range bigger
1535                                                                                         $fRange = 0.05;
1536
                                                                                             // Order by distance to the near point if given, else to the
                                                                                             // found places, else to the centroid of the area polygon.
1537                                                                                         $sOrderBySQL = '';
1538                                                                                         if ($sNearPointSQL) $sOrderBySQL = "ST_Distance($sNearPointSQL, l.centroid)";
1539                                                                                         else if ($sPlaceIDs) $sOrderBySQL = "ST_Distance(l.centroid, f.geometry)";
1540                                                                                         else if ($sPlaceGeom) $sOrderBySQL = "ST_Distance(st_centroid('".$sPlaceGeom."'), l.centroid)";
1541
                                                                                             // The ordering expression is also put into the select list, as
                                                                                             // PostgreSQL requires for SELECT DISTINCT ... ORDER BY.
1542                                                                                         $sSQL = "select distinct l.place_id".($sOrderBySQL?','.$sOrderBySQL:'')." from place_classtype_".$aSearch['sClass']."_".$aSearch['sType']." as l";
1543                                                                                         if ($sCountryCodesSQL) $sSQL .= " join placex as lp using (place_id)";
1544                                                                                         if ($sPlaceIDs)
1545                                                                                         {
1546                                                                                                 $sSQL .= ",placex as f where ";
1547                                                                                                 $sSQL .= "f.place_id in ($sPlaceIDs) and ST_DWithin(l.centroid, f.centroid, $fRange) ";
1548                                                                                         }
1549                                                                                         if ($sPlaceGeom)
1550                                                                                         {
1551                                                                                                 $sSQL .= " where ";
1552                                                                                                 $sSQL .= "ST_Contains('".$sPlaceGeom."', l.centroid) ";
1553                                                                                         }
1554                                                                                         if (sizeof($this->aExcludePlaceIDs))
1555                                                                                         {
1556                                                                                                 $sSQL .= " and l.place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1557                                                                                         }
1558                                                                                         if ($sCountryCodesSQL) $sSQL .= " and lp.calculated_country_code in ($sCountryCodesSQL)";
1559                                                                                         if ($sOrderBySQL) $sSQL .= " order by ".$sOrderBySQL." asc";
1560                                                                                         if ($this->iOffset) $sSQL .= " offset $this->iOffset";
1561                                                                                         $sSQL .= " limit $this->iLimit";
1562                                                                                         if (CONST_Debug) var_dump($sSQL);
1563                                                                                         $aClassPlaceIDs = array_merge($aClassPlaceIDs, $this->oDB->getCol($sSQL));
1564                                                                                 }
1565                                                                                 else
1566                                                                                 {
                                                                                             // No per-class table: search placex directly, using the
                                                                                             // search's own radius when one is set.
1567                                                                                         if (isset($aSearch['fRadius']) && $aSearch['fRadius']) $fRange = $aSearch['fRadius'];
1568
1569                                                                                         $sOrderBySQL = '';
1570                                                                                         if ($sNearPointSQL) $sOrderBySQL = "ST_Distance($sNearPointSQL, l.geometry)";
1571                                                                                         else $sOrderBySQL = "ST_Distance(l.geometry, f.geometry)";
1572
                                                                                             // Use the same $sOrderBySQL in the select list and in the
                                                                                             // order by clause; misspelled names here meant this query
                                                                                             // was never ordered.
1573                                                                                         $sSQL = "select distinct l.place_id".($sOrderBySQL?','.$sOrderBySQL:'')." from placex as l,placex as f where ";
1574                                                                                         $sSQL .= "f.place_id in ( $sPlaceIDs) and ST_DWithin(l.geometry, f.centroid, $fRange) ";
1575                                                                                         $sSQL .= "and l.class='".$aSearch['sClass']."' and l.type='".$aSearch['sType']."' ";
1576                                                                                         if (sizeof($this->aExcludePlaceIDs))
1577                                                                                         {
1578                                                                                                 $sSQL .= " and l.place_id not in (".join(',',$this->aExcludePlaceIDs).")";
1579                                                                                         }
1580                                                                                         if ($sCountryCodesSQL) $sSQL .= " and l.calculated_country_code in ($sCountryCodesSQL)";
1581                                                                                         if ($sOrderBySQL) $sSQL .= " order by ".$sOrderBySQL." asc";
1582                                                                                         if ($this->iOffset) $sSQL .= " offset $this->iOffset";
1583                                                                                         $sSQL .= " limit $this->iLimit";
1584                                                                                         if (CONST_Debug) var_dump($sSQL);
1585                                                                                         $aClassPlaceIDs = array_merge($aClassPlaceIDs, $this->oDB->getCol($sSQL));
1586                                                                                 }
1587                                                                         }
1588                                                                 }
1589
1590                                                                 $aPlaceIDs = $aClassPlaceIDs;
1591
1592                                                         }
1593
1594                                                 }
1595
1596                                                 if (PEAR::IsError($aPlaceIDs))
1597                                                 {
1598                                                         failInternalError("Could not get place IDs from tokens." ,$sSQL, $aPlaceIDs);
1599                                                 }
1600
1601                                                 if (CONST_Debug) { echo "<br><b>Place IDs:</b> "; var_Dump($aPlaceIDs); }
1602
1603                                                 foreach($aPlaceIDs as $iPlaceID)
1604                                                 {
1605                                                         // array for placeID => -1 | Tiger housenumber
1606                                                         $aResultPlaceIDs[$iPlaceID] = $searchedHousenumber;
1607                                                 }
1608                                                 if ($iQueryLoop > 20) break;
1609                                         }
1610
1611                                         if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs) && ($this->iMinAddressRank != 0 || $this->iMaxAddressRank != 30))
1612                                         {
1613                                                 // Need to verify passes rank limits before dropping out of the loop (yuk!)
1614                                                 // reduces the number of place ids, like a filter
1615                                                 $sSQL = "select place_id from placex where place_id in (".join(',',array_keys($aResultPlaceIDs)).") ";
1616                                                 $sSQL .= "and (placex.rank_address between $this->iMinAddressRank and $this->iMaxAddressRank ";
1617                                                 if (14 >= $this->iMinAddressRank && 14 <= $this->iMaxAddressRank) $sSQL .= " OR (extratags->'place') = 'city'";
1618                                                 if ($this->aAddressRankList) $sSQL .= " OR placex.rank_address in (".join(',',$this->aAddressRankList).")";
1619                                                 $sSQL .= ") UNION select place_id from location_property_tiger where place_id in (".join(',',array_keys($aResultPlaceIDs)).") ";
1620                                                 $sSQL .= "and (30 between $this->iMinAddressRank and $this->iMaxAddressRank ";
1621                                                 if ($this->aAddressRankList) $sSQL .= " OR 30 in (".join(',',$this->aAddressRankList).")";
1622                                                 $sSQL .= ")";
1623                                                 if (CONST_Debug) var_dump($sSQL);
1624                                                 $aFilteredPlaceIDs = $this->oDB->getCol($sSQL);
1625                                                 $tempIDs = array();
1626                                                 foreach($aFilteredPlaceIDs as $placeID)
1627                         {
1628                                                         $tempIDs[$placeID] = $aResultPlaceIDs[$placeID];  //assign housenumber to placeID
1629                                                 }
1630                                                 $aResultPlaceIDs = $tempIDs;
1631                                         }
1632
1633                                         //exit;
1634                                         if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs)) break;
1635                                         if ($iGroupLoop > 4) break;
1636                                         if ($iQueryLoop > 30) break;
1637                                 }
1638
1639                                 // Did we find anything?
1640                                 if (isset($aResultPlaceIDs) && sizeof($aResultPlaceIDs))
1641                                 {
1642                                         $aSearchResults = $this->getDetails($aResultPlaceIDs);
1643                                 }
1644
1645                         }
1646                         else
1647                         {
1648                                 // Just interpret as a reverse geocode
1649                                 $iPlaceID = geocodeReverse((float)$this->aNearPoint[0], (float)$this->aNearPoint[1]);
1650                                 if ($iPlaceID)
1651                                         $aSearchResults = $this->getDetails(array($iPlaceID));
1652                                 else
1653                                         $aSearchResults = array();
1654                         }
1655
1656                         // No results? Done
1657                         if (!sizeof($aSearchResults))
1658                         {
1659                                 if ($this->bFallback)
1660                                 {
1661                                         if ($this->fallbackStructuredQuery())
1662                                         {
1663                                                 return $this->lookup();
1664                                         }
1665                                 }
1666
1667                                 return array();
1668                         }
1669
1670                         $aClassType = getClassTypesWithImportance();
1671                         $aRecheckWords = preg_split('/\b[\s,\\-]*/u',$sQuery);
1672                         foreach($aRecheckWords as $i => $sWord)
1673                         {
1674                                 if (!preg_match('/\pL/', $sWord)) unset($aRecheckWords[$i]);
1675                         }
1676
1677                         if (CONST_Debug) { echo '<i>Recheck words:<\i>'; var_dump($aRecheckWords); }
1678
1679                         foreach($aSearchResults as $iResNum => $aResult)
1680                         {
1681                                 // Default
1682                                 $fDiameter = getResultDiameter($aResult);
1683
1684                                 $oPlaceLookup = new PlaceLookup($this->oDB);
1685                                 $oPlaceLookup->setIncludePolygonAsPoints($this->bIncludePolygonAsPoints);
1686                                 $oPlaceLookup->setIncludePolygonAsText($this->bIncludePolygonAsText);
1687                                 $oPlaceLookup->setIncludePolygonAsGeoJSON($this->bIncludePolygonAsGeoJSON);
1688                                 $oPlaceLookup->setIncludePolygonAsKML($this->bIncludePolygonAsKML);
1689                                 $oPlaceLookup->setIncludePolygonAsSVG($this->bIncludePolygonAsSVG);
1690                                 $oPlaceLookup->setPolygonSimplificationThreshold($this->fPolygonSimplificationThreshold);
1691
1692                                 $aOutlineResult = $oPlaceLookup->getOutlines($aResult['place_id'], $aResult['lon'], $aResult['lat'], $fDiameter/2);
1693                                 if ($aOutlineResult)
1694                                 {
1695                                         $aResult = array_merge($aResult, $aOutlineResult);
1696                                 }
1697                                 
1698                                 if ($aResult['extra_place'] == 'city')
1699                                 {
1700                                         $aResult['class'] = 'place';
1701                                         $aResult['type'] = 'city';
1702                                         $aResult['rank_search'] = 16;
1703                                 }
1704
1705                                 // Is there an icon set for this type of result?
1706                                 if (isset($aClassType[$aResult['class'].':'.$aResult['type']]['icon'])
1707                                                 && $aClassType[$aResult['class'].':'.$aResult['type']]['icon'])
1708                                 {
1709                                         $aResult['icon'] = CONST_Website_BaseURL.'images/mapicons/'.$aClassType[$aResult['class'].':'.$aResult['type']]['icon'].'.p.20.png';
1710                                 }
1711
1712                                 if (isset($aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label'])
1713                                                 && $aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label'])
1714                                 {
1715                                         $aResult['label'] = $aClassType[$aResult['class'].':'.$aResult['type'].':'.$aResult['admin_level']]['label'];
1716                                 }
1717                                 elseif (isset($aClassType[$aResult['class'].':'.$aResult['type']]['label'])
1718                                                 && $aClassType[$aResult['class'].':'.$aResult['type']]['label'])
1719                                 {
1720                                         $aResult['label'] = $aClassType[$aResult['class'].':'.$aResult['type']]['label'];
1721                                 }
1722                                 // if tag '&addressdetails=1' is set in query
1723                                 if ($this->bIncludeAddressDetails)
1724                                 {
1725                                         // getAddressDetails() is defined in lib.php and uses the SQL function get_addressdata in functions.sql
1726                                         $aResult['address'] = getAddressDetails($this->oDB, $sLanguagePrefArraySQL, $aResult['place_id'], $aResult['country_code'], $aResultPlaceIDs[$aResult['place_id']]);
1727                                         if ($aResult['extra_place'] == 'city' && !isset($aResult['address']['city']))
1728                                         {
1729                                                 $aResult['address'] = array_merge(array('city' => array_shift(array_values($aResult['address']))), $aResult['address']);
1730                                         }
1731                                 }
1732                                 if ($this->bIncludeExtraTags)
1733                                 {
1734                                         if ($aResult['extra'])
1735                                         {
1736                                                 $aResult['sExtraTags'] = json_decode($aResult['extra']);
1737                                         }
1738                                         else
1739                                         {
1740                                                 $aResult['sExtraTags'] = (object) array();
1741                                         }
1742                                 }
1743
1744                                 if ($this->bIncludeNameDetails)
1745                                 {
1746                                         if ($aResult['names'])
1747                                         {
1748                                                 $aResult['sNameDetails'] = json_decode($aResult['names']);
1749                                         }
1750                                         else
1751                                         {
1752                                                 $aResult['sNameDetails'] = (object) array();
1753                                         }
1754                                 }
1755
1756                                 // Adjust importance for the number of exact string matches in the result
1757                                 $aResult['importance'] = max(0.001,$aResult['importance']);
1758                                 $iCountWords = 0;
1759                                 $sAddress = $aResult['langaddress'];
1760                                 foreach($aRecheckWords as $i => $sWord)
1761                                 {
1762                                         if (stripos($sAddress, $sWord)!==false)
1763                                         {
1764                                                 $iCountWords++;
1765                                                 if (preg_match("/(^|,)\s*".preg_quote($sWord, '/')."\s*(,|$)/", $sAddress)) $iCountWords += 0.1;
1766                                         }
1767                                 }
1768
1769                                 $aResult['importance'] = $aResult['importance'] + ($iCountWords*0.1); // 0.1 is a completely arbitrary number but something in the range 0.1 to 0.5 would seem right
1770
1771                                 $aResult['name'] = $aResult['langaddress'];
1772                                 // secondary ordering (for results with same importance (the smaller the better):
1773                                 //   - approximate importance of address parts
1774                                 $aResult['foundorder'] = -$aResult['addressimportance']/10;
1775                                 //   - number of exact matches from the query
1776                                 if (isset($this->exactMatchCache[$aResult['place_id']]))
1777                                         $aResult['foundorder'] -= $this->exactMatchCache[$aResult['place_id']];
1778                                 else if (isset($this->exactMatchCache[$aResult['parent_place_id']]))
1779                                         $aResult['foundorder'] -= $this->exactMatchCache[$aResult['parent_place_id']];
1780                                 //  - importance of the class/type
1781                                 if (isset($aClassType[$aResult['class'].':'.$aResult['type']]['importance'])
1782                                         && $aClassType[$aResult['class'].':'.$aResult['type']]['importance'])
1783                                 {
1784                                         $aResult['foundorder'] += 0.0001 * $aClassType[$aResult['class'].':'.$aResult['type']]['importance'];
1785                                 }
1786                                 else
1787                                 {
1788                                         $aResult['foundorder'] += 0.01;
1789                                 }
1790                                 if (CONST_Debug) { var_dump($aResult); }
1791                                 $aSearchResults[$iResNum] = $aResult;
1792                         }
1793                         uasort($aSearchResults, 'byImportance');
1794
1795                         $aOSMIDDone = array();
1796                         $aClassTypeNameDone = array();
1797                         $aToFilter = $aSearchResults;
1798                         $aSearchResults = array();
1799
1800                         $bFirst = true;
1801                         foreach($aToFilter as $iResNum => $aResult)
1802                         {
1803                                 $this->aExcludePlaceIDs[$aResult['place_id']] = $aResult['place_id'];
1804                                 if ($bFirst)
1805                                 {
1806                                         $fLat = $aResult['lat'];
1807                                         $fLon = $aResult['lon'];
1808                                         if (isset($aResult['zoom'])) $iZoom = $aResult['zoom'];
1809                                         $bFirst = false;
1810                                 }
1811                                 if (!$this->bDeDupe || (!isset($aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']])
1812                                                         && !isset($aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']])))
1813                                 {
1814                                         $aOSMIDDone[$aResult['osm_type'].$aResult['osm_id']] = true;
1815                                         $aClassTypeNameDone[$aResult['osm_type'].$aResult['class'].$aResult['type'].$aResult['name'].$aResult['admin_level']] = true;
1816                                         $aSearchResults[] = $aResult;
1817                                 }
1818
1819                                 // Absolute limit on number of results
1820                                 if (sizeof($aSearchResults) >= $this->iFinalLimit) break;
1821                         }
1822
1823                         return $aSearchResults;
1824
1825                 } // end lookup()
1826
1827
1828         } // end class
1829