This script uses osmium-tool. It must be installed before executing the import script.
Installation instructions can be found [here](https://osmcode.org/osmium-tool/manual.html#installation).
-## Updating multiple regions
+### Updating multiple regions
To import multiple regions into your database, you need to configure and run `utils/update_database.sh`.
This uses the update directory set up during database setup.
The script fetches diffs from the replication server, imports them and indexes the database. The default replication server in the script ([Geofabrik](https://download.geofabrik.de)) provides daily updates.
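Once configured, the script is typically run regularly, for example from cron. A sketch of a possible crontab entry (the paths are examples, not part of the script):

```shell
# Run one update cycle per day; adjust paths to your installation.
30 3 * * *  cd /srv/nominatim/build && ./utils/update_database.sh >> /var/log/nominatim-update.log 2>&1
```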
-## Verification and further setup
+## Importing Nominatim to an external PostgreSQL database
-Instructions for import verification and other details like importing Wikidata can be found in the [import section](Import.md)
+You can install Nominatim using a database that runs on a different server when
+you have physical access to the file system on the other server. Nominatim
+uses a custom normalization library that needs to be made accessible to the
+PostgreSQL server. This section explains how to set up the normalization
+library.
+### Option 1: Compiling the library on the database server
+
+The safest way to get a working library is to compile it on the database
+server. From the prerequisites you need at least cmake, gcc and the
+PostgreSQL server package.
+
+Clone or unpack the Nominatim source code, enter the source directory and
+create and enter a build directory.
+
+```sh
+cd Nominatim
+mkdir build
+cd build
+```
+
+Now configure cmake to only build the PostgreSQL module and build it:
+
+```sh
+cmake -DBUILD_IMPORTER=off -DBUILD_API=off -DBUILD_TESTS=off -DBUILD_DOCS=off -DBUILD_OSM2PGSQL=off ..
+make
+```
+
+When done, you find the normalization library in `build/module/nominatim.so`.
+Copy it to a place where it is readable and executable by the PostgreSQL server
+process.
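As a sketch, assuming `/usr/lib/nominatim` as the target directory (the path is an example, any directory the server process can read works):

```shell
# Example only: copy the module and make it readable and
# executable for the PostgreSQL server process.
sudo mkdir -p /usr/lib/nominatim
sudo cp build/module/nominatim.so /usr/lib/nominatim/
sudo chmod 755 /usr/lib/nominatim/nominatim.so
```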
+
+### Option 2: Compiling the library on the import machine
+
+You can also compile the normalization library on the machine from where you
+run the import.
+
+!!! important
+ You can only do this when the database server and the import machine have
+ the same architecture and run the same version of Linux. Otherwise there is
+ no guarantee that the compiled library is compatible with the PostgreSQL
+ server running on the database server.
+
+Make sure that the PostgreSQL server package is installed on the machine
+**with the same version as on the database server**. The server itself does
+not need to be running on the import machine.
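One way to check that the versions agree is to compare `pg_config --version` on both machines (assuming the installed packages provide `pg_config`):

```shell
# Should report the same major version on the import machine
# and on the database server, e.g. "PostgreSQL 12.4".
pg_config --version
```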
+
+Download and compile Nominatim as per standard instructions. Once done, you find
+the normalization library in `build/module/nominatim.so`. Copy the file to
+the database server at a location where it is readable and executable by the
+PostgreSQL server process.
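A sketch of the copy step, using a hypothetical host name `dbserver` and target directory `/srv/nominatim/module` (both are placeholders):

```shell
# Host and path are placeholders; adjust to your environment.
scp build/module/nominatim.so dbserver:/srv/nominatim/module/
ssh dbserver chmod 755 /srv/nominatim/module/nominatim.so
```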
+
+### Running the import
+
+On the client side you now need to configure the import to point to the
+correct location of the library **on the database server**. Add the following
+line to your `settings/local.php` file:
+
+```php
+@define('CONST_Database_Module_Path', '<directory on the database server where nominatim.so resides>');
+```
+
+Now change the `CONST_Database_DSN` to point to your remote server and continue
+to follow the [standard instructions for importing](/admin/Import).
## 3.5.0 -> master
+### Change order during indexing
+
+When reindexing places during updates, they are now processed in a different
+order, which requires a different database index. Create it with the following
+SQL command:
+
+```sql
+CREATE INDEX idx_placex_pendingsector_rank_address
+ ON placex USING BTREE (rank_address, geometry_sector) where indexed_status > 0;
+```
+
+You can then drop the old index with:
+
+```sql
+DROP INDEX idx_placex_pendingsector;
+```
+
+
### Switching to dotenv
As part of the work changing the configuration format, the configuration for
info('Index ranks 0 - 4');
$oCmd = (clone $oBaseCmd)->addParams('--maxrank', 4);
echo $oCmd->escapedCmd();
-
+
$iStatus = $oCmd->run();
if ($iStatus != 0) {
fail('error status ' . $iStatus . ' running nominatim!');
}
if (!$bIndexNoanalyse) $this->pgsqlRunScript('ANALYSE');
+ info('Index administrative boundaries');
+ $oCmd = (clone $oBaseCmd)->addParams('-b');
+ $iStatus = $oCmd->run();
+ if ($iStatus != 0) {
+ fail('error status ' . $iStatus . ' running nominatim!');
+ }
+
info('Index ranks 5 - 25');
$oCmd = (clone $oBaseCmd)->addParams('--minrank', 5, '--maxrank', 25);
$iStatus = $oCmd->run();
if ($iStatus != 0) {
fail('error status ' . $iStatus . ' running nominatim!');
}
+
if (!$bIndexNoanalyse) $this->pgsqlRunScript('ANALYSE');
info('Index ranks 26 - 30');
--- /dev/null
+# SPDX-License-Identifier: GPL-2.0-only
+#
+# This file is part of Nominatim.
+# Copyright (C) 2020 Sarah Hoffmann
+
+import logging
+import psycopg2
+from psycopg2.extras import wait_select
+
+log = logging.getLogger()
+
+def make_connection(options, asynchronous=False):
+ params = {'dbname' : options.dbname,
+ 'user' : options.user,
+ 'password' : options.password,
+ 'host' : options.host,
+ 'port' : options.port,
+ 'async' : asynchronous}
+
+ return psycopg2.connect(**params)
+
+class DBConnection(object):
+ """ A single non-blocking database connection.
+ """
+
+ def __init__(self, options):
+ self.current_query = None
+ self.current_params = None
+ self.options = options
+
+ self.conn = None
+ self.connect()
+
+ def connect(self):
+ """ (Re)connect to the database. Creates an asynchronous connection
+ with JIT and parallel processing disabled. If a connection was
+ already open, it is closed and a new connection established.
+ The caller must ensure that no query is pending before reconnecting.
+ """
+ if self.conn is not None:
+ self.cursor.close()
+ self.conn.close()
+
+ self.conn = make_connection(self.options, asynchronous=True)
+ self.wait()
+
+ self.cursor = self.conn.cursor()
+ # Disable JIT and parallel workers as they are known to cause problems.
+ # Update pg_settings instead of using SET because it does not yield
+ # errors on older versions of Postgres where the settings are not
+ # implemented.
+ self.perform(
+ """ UPDATE pg_settings SET setting = -1 WHERE name = 'jit_above_cost';
+ UPDATE pg_settings SET setting = 0
+ WHERE name = 'max_parallel_workers_per_gather';""")
+ self.wait()
+
+ def wait(self):
+ """ Block until any pending operation is done.
+ """
+ while True:
+ try:
+ wait_select(self.conn)
+ self.current_query = None
+ return
+ except psycopg2.extensions.TransactionRollbackError as e:
+ if e.pgcode == '40P01':
+ log.info("Deadlock detected (params = {}), retry."
+ .format(self.current_params))
+ self.cursor.execute(self.current_query, self.current_params)
+ else:
+ raise
+ except psycopg2.errors.DeadlockDetected:
+ self.cursor.execute(self.current_query, self.current_params)
+
+ def perform(self, sql, args=None):
+ """ Send SQL query to the server. Returns immediately without
+ blocking.
+ """
+ self.current_query = sql
+ self.current_params = args
+ self.cursor.execute(sql, args)
+
+ def fileno(self):
+ """ File descriptor to wait for. (Makes this class select()able.)
+ """
+ return self.conn.fileno()
+
+ def is_done(self):
+ """ Check if the connection is available for a new query.
+
+ Also checks if the previous query has run into a deadlock.
+ If so, then the previous query is repeated.
+ """
+ if self.current_query is None:
+ return True
+
+ try:
+ if self.conn.poll() == psycopg2.extensions.POLL_OK:
+ self.current_query = None
+ return True
+ except psycopg2.extensions.TransactionRollbackError as e:
+ if e.pgcode == '40P01':
+ log.info("Deadlock detected (params = {}), retry.".format(self.current_params))
+ self.cursor.execute(self.current_query, self.current_params)
+ else:
+ raise
+ except psycopg2.errors.DeadlockDetected:
+ self.cursor.execute(self.current_query, self.current_params)
+
+ return False
+
import re
import getpass
from datetime import datetime
-import psycopg2
-from psycopg2.extras import wait_select
import select
from indexer.progress import ProgressLogger
+from indexer.db import DBConnection, make_connection
log = logging.getLogger()
-def make_connection(options, asynchronous=False):
- params = {'dbname' : options.dbname,
- 'user' : options.user,
- 'password' : options.password,
- 'host' : options.host,
- 'port' : options.port,
- 'async' : asynchronous}
-
- return psycopg2.connect(**params)
-
-
class RankRunner(object):
""" Returns SQL commands for indexing one rank within the placex table.
"""
def sql_count_objects(self):
return """SELECT count(*) FROM placex
- WHERE rank_search = {} and indexed_status > 0
+ WHERE rank_address = {} and indexed_status > 0
""".format(self.rank)
def sql_get_objects(self):
return """SELECT place_id FROM placex
- WHERE indexed_status > 0 and rank_search = {}
+ WHERE indexed_status > 0 and rank_address = {}
ORDER BY geometry_sector""".format(self.rank)
def sql_index_place(self, ids):
SET indexed_status = 0 WHERE place_id IN ({})"""\
.format(','.join((str(i) for i in ids)))
-
-class DBConnection(object):
- """ A single non-blocking database connection.
+class BoundaryRunner(object):
+ """ Returns SQL commands for indexing the administrative boundaries
+ of a certain rank.
"""
- def __init__(self, options):
- self.current_query = None
- self.current_params = None
-
- self.conn = None
- self.connect()
-
- def connect(self):
- if self.conn is not None:
- self.cursor.close()
- self.conn.close()
-
- self.conn = make_connection(options, asynchronous=True)
- self.wait()
-
- self.cursor = self.conn.cursor()
- # Disable JIT and parallel workers as they are known to cause problems.
- # Update pg_settings instead of using SET because it does not yield
- # errors on older versions of Postgres where the settings are not
- # implemented.
- self.perform(
- """ UPDATE pg_settings SET setting = -1 WHERE name = 'jit_above_cost';
- UPDATE pg_settings SET setting = 0
- WHERE name = 'max_parallel_workers_per_gather';""")
- self.wait()
-
- def wait(self):
- """ Block until any pending operation is done.
- """
- while True:
- try:
- wait_select(self.conn)
- self.current_query = None
- return
- except psycopg2.extensions.TransactionRollbackError as e:
- if e.pgcode == '40P01':
- log.info("Deadlock detected (params = {}), retry."
- .format(self.current_params))
- self.cursor.execute(self.current_query, self.current_params)
- else:
- raise
- except psycopg2.errors.DeadlockDetected:
- self.cursor.execute(self.current_query, self.current_params)
-
- def perform(self, sql, args=None):
- """ Send SQL query to the server. Returns immediately without
- blocking.
- """
- self.current_query = sql
- self.current_params = args
- self.cursor.execute(sql, args)
-
- def fileno(self):
- """ File descriptor to wait for. (Makes this class select()able.)
- """
- return self.conn.fileno()
+ def __init__(self, rank):
+ self.rank = rank
- def is_done(self):
- """ Check if the connection is available for a new query.
+ def name(self):
+ return "boundaries rank {}".format(self.rank)
- Also checks if the previous query has run into a deadlock.
- If so, then the previous query is repeated.
- """
- if self.current_query is None:
- return True
-
- try:
- if self.conn.poll() == psycopg2.extensions.POLL_OK:
- self.current_query = None
- return True
- except psycopg2.extensions.TransactionRollbackError as e:
- if e.pgcode == '40P01':
- log.info("Deadlock detected (params = {}), retry.".format(self.current_params))
- self.cursor.execute(self.current_query, self.current_params)
- else:
- raise
- except psycopg2.errors.DeadlockDetected:
- self.cursor.execute(self.current_query, self.current_params)
+ def sql_count_objects(self):
+ return """SELECT count(*) FROM placex
+ WHERE indexed_status > 0
+ AND rank_search = {}
+ AND class = 'boundary' and type = 'administrative'""".format(self.rank)
- return False
+ def sql_get_objects(self):
+ return """SELECT place_id FROM placex
+ WHERE indexed_status > 0 and rank_search = {}
+ and class = 'boundary' and type = 'administrative'
+ ORDER BY partition, admin_level""".format(self.rank)
+ def sql_index_place(self, ids):
+ return "UPDATE placex SET indexed_status = 0 WHERE place_id IN ({})"\
+ .format(','.join((str(i) for i in ids)))
class Indexer(object):
""" Main indexing routine.
"""
def __init__(self, options):
- self.minrank = max(0, options.minrank)
+ self.minrank = max(1, options.minrank)
self.maxrank = min(30, options.maxrank)
self.conn = make_connection(options)
self.threads = [DBConnection(options) for i in range(options.threads)]
- def run(self):
- """ Run indexing over the entire database.
+ def index_boundaries(self):
+ log.warning("Starting indexing boundaries using {} threads".format(
+ len(self.threads)))
+
+ for rank in range(max(self.minrank, 5), min(self.maxrank, 26)):
+ self.index(BoundaryRunner(rank))
+
+ def index_by_rank(self):
+ """ Run classic indexing by rank.
"""
log.warning("Starting indexing rank ({} to {}) using {} threads".format(
self.minrank, self.maxrank, len(self.threads)))
- for rank in range(self.minrank, self.maxrank):
+ for rank in range(max(1, self.minrank), self.maxrank):
self.index(RankRunner(rank))
+
if self.maxrank == 30:
+ self.index(RankRunner(0), 20)
self.index(InterpolationRunner(), 20)
self.index(RankRunner(self.maxrank), 20)
cur.close()
- next_thread = self.find_free_thread()
progress = ProgressLogger(obj.name(), total_tuples)
- cur = self.conn.cursor(name='places')
- cur.execute(obj.sql_get_objects())
+ if total_tuples > 0:
+ cur = self.conn.cursor(name='places')
+ cur.execute(obj.sql_get_objects())
- while True:
- places = [p[0] for p in cur.fetchmany(batch)]
- if len(places) == 0:
- break
+ next_thread = self.find_free_thread()
+ while True:
+ places = [p[0] for p in cur.fetchmany(batch)]
+ if len(places) == 0:
+ break
- log.debug("Processing places: {}".format(places))
- thread = next(next_thread)
+ log.debug("Processing places: {}".format(places))
+ thread = next(next_thread)
- thread.perform(obj.sql_index_place(places))
- progress.add(len(places))
+ thread.perform(obj.sql_index_place(places))
+ progress.add(len(places))
- cur.close()
+ cur.close()
- for t in self.threads:
- t.wait()
+ for t in self.threads:
+ t.wait()
progress.done()
p.add_argument('-P', '--port',
dest='port', action='store',
help='PostgreSQL server port')
+ p.add_argument('-b', '--boundary-only',
+ dest='boundary_only', action='store_true',
+ help='Only index administrative boundaries (ignores min/maxrank).')
p.add_argument('-r', '--minrank',
dest='minrank', type=int, metavar='RANK', default=0,
help='Minimum/starting rank.')
password = getpass.getpass("Database password: ")
options.password = password
- Indexer(options).run()
+ if options.boundary_only:
+ Indexer(options).index_boundaries()
+ else:
+ Indexer(options).index_by_rank()
"mini_roundabout" : "skip",
"noexit" : "skip",
"crossing" : "skip",
+ "give_way" : "skip",
+ "stop" : "skip",
+ "street_lamp" : "main,with_name",
"traffic_signals" : "main,with_name",
"service" : "main,with_name",
"cycleway" : "main,with_name",
"mini_roundabout" : "skip",
"noexit" : "skip",
"crossing" : "skip",
+ "give_way" : "skip",
+ "stop" : "skip",
+ "street_lamp" : "main,with_name",
"traffic_signals" : "main,with_name",
"service" : "main,with_name",
"cycleway" : "main,with_name",
AS $$
DECLARE
lookup_token TEXT;
+ id INTEGER;
return_word_id INTEGER[];
BEGIN
lookup_token := make_standard_name(lookup_word);
SELECT array_agg(word_id) FROM word
WHERE word_token = lookup_token and class is null and type is null
INTO return_word_id;
+ IF return_word_id IS NULL THEN
+ id := nextval('seq_word');
+ INSERT INTO word VALUES (id, lookup_token, null, null, null, null, 0);
+ return_word_id = ARRAY[id];
+ END IF;
RETURN return_word_id;
END;
$$
-LANGUAGE plpgsql STABLE;
+LANGUAGE plpgsql;
-- Normalize a string and look up its name ids (full words).
where linked_place_id = NEW.place_id;
-- update not necessary for osmline, cause linked_place_id does not exist
+ NEW.extratags := NEW.extratags - 'linked_place'::TEXT;
+
IF NEW.linked_place_id is not null THEN
--DEBUG: RAISE WARNING 'place already linked to %', NEW.linked_place_id;
RETURN NEW;
END IF;
+ -- Speed up searches - just use the centroid of the feature
+ -- cheaper but less accurate
+ NEW.centroid := ST_PointOnSurface(NEW.geometry);
+ --DEBUG: RAISE WARNING 'Computing preliminary centroid at %',ST_AsText(NEW.centroid);
+
-- recompute the ranks, they might change when linking changes
SELECT * INTO NEW.rank_search, NEW.rank_address
FROM compute_place_rank(NEW.country_code,
(NEW.extratags->'capital') = 'yes',
NEW.address->'postcode');
-- We must always increase the address level relative to the admin boundary.
- IF NEW.class = 'boundary' and NEW.type = 'administrative' THEN
- parent_address_level := get_parent_address_level(NEW.geometry, NEW.admin_level);
+ IF NEW.class = 'boundary' and NEW.type = 'administrative' and NEW.osm_type = 'R' THEN
+ parent_address_level := get_parent_address_level(NEW.centroid, NEW.admin_level);
IF parent_address_level >= NEW.rank_address THEN
IF parent_address_level >= 24 THEN
NEW.rank_address := 25;
END IF;
END IF;
- -- Speed up searches - just use the centroid of the feature
- -- cheaper but less acurate
- NEW.centroid := ST_PointOnSurface(NEW.geometry);
- --DEBUG: RAISE WARNING 'Computing preliminary centroid at %',ST_AsText(NEW.centroid);
-
NEW.postcode := null;
-- recalculate country and partition
BEGIN
-- RAISE WARNING 'placex_delete % %',OLD.osm_type,OLD.osm_id;
- update placex set linked_place_id = null, indexed_status = 2 where linked_place_id = OLD.place_id and indexed_status = 0;
- --DEBUG: RAISE WARNING 'placex_delete:01 % %',OLD.osm_type,OLD.osm_id;
- update placex set linked_place_id = null where linked_place_id = OLD.place_id;
- --DEBUG: RAISE WARNING 'placex_delete:02 % %',OLD.osm_type,OLD.osm_id;
+ IF OLD.linked_place_id is null THEN
+ update placex set linked_place_id = null, indexed_status = 2 where linked_place_id = OLD.place_id and indexed_status = 0;
+ --DEBUG: RAISE WARNING 'placex_delete:01 % %',OLD.osm_type,OLD.osm_id;
+ update placex set linked_place_id = null where linked_place_id = OLD.place_id;
+ --DEBUG: RAISE WARNING 'placex_delete:02 % %',OLD.osm_type,OLD.osm_id;
+ ELSE
+ update placex set indexed_status = 2 where place_id = OLD.linked_place_id and indexed_status = 0;
+ END IF;
IF OLD.rank_address < 30 THEN
geo RECORD;
BEGIN
-- 10000000000 is ~~ 1x1 degree
- FOR geo IN select quad_split_geometry(geometry, 0.25, 20) as geom LOOP
+ FOR geo IN select quad_split_geometry(geometry, 0.01, 20) as geom LOOP
RETURN NEXT geo.geom;
END LOOP;
RETURN;
-- Indices used only during search and update.
-- These indices are created only after the indexing process is done.
-CREATE INDEX CONCURRENTLY idx_placex_pendingsector ON placex USING BTREE (rank_search,geometry_sector) {ts:address-index} where indexed_status > 0;
+CREATE INDEX CONCURRENTLY idx_placex_pendingsector ON placex USING BTREE (rank_address,geometry_sector) {ts:address-index} where indexed_status > 0;
CREATE INDEX CONCURRENTLY idx_location_area_country_place_id ON location_area_country USING BTREE (place_id) {ts:address-index};
| W1 | W11 |
Scenario: Locality points should contain all boundaries they touch
- Given the grid
+ Given the 0.001 grid
| 1 | | | 2 | | 3 |
| | | | 8 | | |
| 4 | | | 5 | | 6 |
| object | nameaddress_vector |
| W1 | bonn, new york, smalltown |
- Scenario: A known addr:* tag is not added if the name is unknown
+ Scenario: A known addr:* tag is added even if the name is unknown
Given the scene roads-with-pois
And the places
| osm | class | type | name | addr+city | geometry |
| W1 | highway | residential | Road | Nandu | :w-north |
When importing
- Then search_name contains not
+ Then search_name contains
| object | nameaddress_vector |
| W1 | nandu |
| object | extratags |
| R1 | 'wikidata' : '34', 'oneway' : 'yes', 'linked_place' : 'city' |
+ Scenario: Remove linked_place info when linkee is removed
+ Given the places
+ | osm | class | type | name | geometry |
+ | N1 | place | city | foo | 0 0 |
+ And the places
+ | osm | class | type | name | admin | geometry |
+ | R1 | boundary | administrative | foo | 8 | poly-area:0.1 |
+ When importing
+ Then placex contains
+ | object | extratags |
+ | R1 | 'linked_place' : 'city' |
+ When marking for delete N1
+ Then placex contains
+ | object | extratags |
+ | R1 | |
+
+ Scenario: Update linked_place info when linkee type changes
+ Given the places
+ | osm | class | type | name | geometry |
+ | N1 | place | city | foo | 0 0 |
+ And the places
+ | osm | class | type | name | admin | geometry |
+ | R1 | boundary | administrative | foo | 8 | poly-area:0.1 |
+ When importing
+ Then placex contains
+ | object | extratags |
+ | R1 | 'linked_place' : 'city' |
+ When updating places
+ | osm | class | type | name | geometry |
+ | N1 | place | town | foo | 0 0 |
+ Then placex contains
+ | object | extratags |
+ | R1 | 'linked_place' : 'town' |
import os
from nose.tools import * # for assert functions
-@given(u'the (\d+ )?grid')
+@given(u'the ([0-9.]+ )?grid')
def define_node_grid(context, grid_step):
"""
Define a grid of node positions.
"""
if grid_step is not None:
- grid_step = int(grd_step.strip())
+ grid_step = float(grid_step.strip())
else:
grid_step = 0.00001
if ($aResult['index']) {
$oCmd = (clone $oIndexCmd)
- ->addParams('--minrank', $aResult['index-rank']);
+ ->addParams('--minrank', $aResult['index-rank'], '-b');
+ $oCmd->run();
- // echo $oCmd->escapedCmd()."\n";
+ $oCmd = (clone $oIndexCmd)
+ ->addParams('--minrank', $aResult['index-rank']);
$oCmd->run();
$oDB->exec('update import_status set indexed = true');
// Index file
if (!$aResult['no-index']) {
- $oThisIndexCmd = clone($oIndexCmd);
$fCMDStartTime = time();
+ $oThisIndexCmd = clone($oIndexCmd);
+ $oThisIndexCmd->addParams('-b');
+ echo $oThisIndexCmd->escapedCmd()."\n";
+ $iErrorLevel = $oThisIndexCmd->run();
+ if ($iErrorLevel) {
+ echo "Error: $iErrorLevel\n";
+ exit($iErrorLevel);
+ }
+
+ $oThisIndexCmd = clone($oIndexCmd);
echo $oThisIndexCmd->escapedCmd()."\n";
$iErrorLevel = $oThisIndexCmd->run();
if ($iErrorLevel) {