X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/3905dd68dd5b261449df7df243c594b25995d8bd..e1dc4379e0cd100200ac53752442143ca4846fc5:/src/nominatim_db/indexer/indexer.py?ds=sidebyside diff --git a/src/nominatim_db/indexer/indexer.py b/src/nominatim_db/indexer/indexer.py index 9d42922b..d467efbd 100644 --- a/src/nominatim_db/indexer/indexer.py +++ b/src/nominatim_db/indexer/indexer.py @@ -21,6 +21,7 @@ from . import runners LOG = logging.getLogger() + class Indexer: """ Main indexing routine. """ @@ -30,7 +31,6 @@ class Indexer: self.tokenizer = tokenizer self.num_threads = num_threads - def has_pending(self) -> bool: """ Check if any data still needs indexing. This function must only be used after the import has finished. @@ -41,7 +41,6 @@ class Indexer: cur.execute("SELECT 'a' FROM placex WHERE indexed_status > 0 LIMIT 1") return cur.rowcount > 0 - async def index_full(self, analyse: bool = True) -> None: """ Index the complete database. This will first index boundaries followed by all other objects. When `analyse` is True, then the @@ -75,7 +74,6 @@ class Indexer: if not self.has_pending(): break - async def index_boundaries(self, minrank: int, maxrank: int) -> int: """ Index only administrative boundaries within the given rank range. """ @@ -138,7 +136,6 @@ class Indexer: (minrank, maxrank)) total_tuples = {row.rank_address: row.count for row in cur} - with self.tokenizer.name_analyzer() as analyzer: for rank in range(max(1, minrank), maxrank + 1): if rank >= 30: @@ -156,7 +153,6 @@ class Indexer: return total - async def index_postcodes(self) -> int: """Index the entries of the location_postcode table. """ @@ -164,7 +160,6 @@ class Indexer: return await self._index(runners.PostcodeRunner(), batch=20) - def update_status_table(self) -> None: """ Update the status in the status table to 'indexed'. """ @@ -193,7 +188,7 @@ class Indexer: if total_tuples > 0: async with await psycopg.AsyncConnection.connect( - self.dsn, row_factory=psycopg.rows.dict_row) as aconn,\ + self.dsn, row_factory=psycopg.rows.dict_row) as aconn, \ QueryPool(self.dsn, self.num_threads, autocommit=True) as pool: fetcher_time = 0.0 tstart = time.time() @@ -224,7 +219,6 @@ class Indexer: return progress.done() - def _prepare_indexing(self, runner: runners.Runner) -> int: with connect(self.dsn) as conn: hstore_info = psycopg.types.TypeInfo.fetch(conn, "hstore")