X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/0f196952259baddb77bd1c60ffc3b5ef214da179..041794615320f836ed58511437d29ba0b1379777:/nominatim/db/sqlalchemy_functions.py diff --git a/nominatim/db/sqlalchemy_functions.py b/nominatim/db/sqlalchemy_functions.py index 064fa6a3..6a5809bd 100644 --- a/nominatim/db/sqlalchemy_functions.py +++ b/nominatim/db/sqlalchemy_functions.py @@ -7,27 +7,118 @@ """ Custom functions and expressions for SQLAlchemy. """ +from __future__ import annotations from typing import Any import sqlalchemy as sa -from sqlalchemy.sql.expression import FunctionElement from sqlalchemy.ext.compiler import compiles from nominatim.typing import SaColumn -# pylint: disable=abstract-method,missing-function-docstring,consider-using-f-string +# pylint: disable=all -def select_index_placex_geometry_reverse_lookuppolygon(table: str) -> 'sa.TextClause': - """ Create an expression with the necessary conditions over a placex - table that the index 'idx_placex_geometry_reverse_lookupPolygon' - can be used. +class PlacexGeometryReverseLookuppolygon(sa.sql.functions.GenericFunction[bool]): + """ Check for conditions that allow partial index use on + 'idx_placex_geometry_reverse_lookupPolygon'. + + Needs to be constant, so that the query planner picks them up correctly + in prepared statements. """ - return sa.text(f"ST_GeometryType({table}.geometry) in ('ST_Polygon', 'ST_MultiPolygon')" - f" AND {table}.rank_address between 4 and 25" - f" AND {table}.type != 'postcode'" - f" AND {table}.name is not null" - f" AND {table}.indexed_status = 0" - f" AND {table}.linked_place_id is null") + type = sa.Boolean() + name = 'PlacexGeometryReverseLookuppolygon' + inherit_cache = True + + +@compiles(PlacexGeometryReverseLookuppolygon) # type: ignore[no-untyped-call, misc] +def _default_intersects(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + return ("(ST_GeometryType(placex.geometry) in ('ST_Polygon', 'ST_MultiPolygon')" + " AND placex.rank_address between 4 and 25" + " AND placex.type != 'postcode'" + " AND placex.name is not null" + " AND placex.indexed_status = 0" + " AND placex.linked_place_id is null)") + + +@compiles(PlacexGeometryReverseLookuppolygon, 'sqlite') # type: ignore[no-untyped-call, misc] +def _sqlite_intersects(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + return ("(ST_GeometryType(placex.geometry) in ('POLYGON', 'MULTIPOLYGON')" + " AND placex.rank_address between 4 and 25" + " AND placex.type != 'postcode'" + " AND placex.name is not null" + " AND placex.indexed_status = 0" + " AND placex.linked_place_id is null)") + + +class IntersectsReverseDistance(sa.sql.functions.GenericFunction[bool]): + type = sa.Boolean() + name = 'IntersectsReverseDistance' + inherit_cache = True + + def __init__(self, table: sa.Table, geom: SaColumn) -> None: + super().__init__(table.c.geometry, # type: ignore[no-untyped-call] + table.c.rank_search, geom) + self.tablename = table.name + + +@compiles(IntersectsReverseDistance) # type: ignore[no-untyped-call, misc] +def default_reverse_place_diameter(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + table = element.tablename + return f"{table}.rank_address between 4 and 25"\ + f" AND {table}.type != 'postcode'"\ + f" AND {table}.name is not null"\ + f" AND {table}.linked_place_id is null"\ + f" AND {table}.osm_type = 'N'" + \ + " AND ST_Buffer(%s, reverse_place_diameter(%s)) && %s" % \ + tuple(map(lambda c: compiler.process(c, **kw), element.clauses)) + + +@compiles(IntersectsReverseDistance, 'sqlite') # type: ignore[no-untyped-call, misc] +def sqlite_reverse_place_diameter(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + geom1, rank, geom2 = list(element.clauses) + table = element.tablename + + return (f"{table}.rank_address between 4 and 25"\ + f" AND {table}.type != 'postcode'"\ + f" AND {table}.name is not null"\ + f" AND {table}.linked_place_id is null"\ + f" AND {table}.osm_type = 'N'"\ + " AND MbrIntersects(%s, ST_Expand(%s, 14.0 * exp(-0.2 * %s) - 0.03))"\ + f" AND {table}.place_id IN"\ + " (SELECT place_id FROM placex_place_node_areas"\ + " WHERE ROWID IN (SELECT ROWID FROM SpatialIndex"\ + " WHERE f_table_name = 'placex_place_node_areas'"\ + " AND search_frame = %s))") % ( + compiler.process(geom1, **kw), + compiler.process(geom2, **kw), + compiler.process(rank, **kw), + compiler.process(geom2, **kw)) + + +class IsBelowReverseDistance(sa.sql.functions.GenericFunction[bool]): + type = sa.Boolean() + name = 'IsBelowReverseDistance' + inherit_cache = True + + +@compiles(IsBelowReverseDistance) # type: ignore[no-untyped-call, misc] +def default_is_below_reverse_distance(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + dist, rank = list(element.clauses) + return "%s < reverse_place_diameter(%s)" % (compiler.process(dist, **kw), + compiler.process(rank, **kw)) + + +@compiles(IsBelowReverseDistance, 'sqlite') # type: ignore[no-untyped-call, misc] +def sqlite_is_below_reverse_distance(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + dist, rank = list(element.clauses) + return "%s < 14.0 * exp(-0.2 * %s) - 0.03" % (compiler.process(dist, **kw), + compiler.process(rank, **kw)) + def select_index_placex_geometry_reverse_lookupplacenode(table: str) -> 'sa.TextClause': """ Create an expression with the necessary conditions over a placex @@ -41,10 +132,11 @@ def select_index_placex_geometry_reverse_lookupplacenode(table: str) -> 'sa.Text f" AND {table}.osm_type = 'N'") -class CrosscheckNames(FunctionElement[Any]): +class CrosscheckNames(sa.sql.functions.GenericFunction[bool]): """ Check if in the given list of names in parameters 1 any of the names from the JSON array in parameter 2 are contained. """ + type = sa.Boolean() name = 'CrosscheckNames' inherit_cache = True @@ -54,3 +146,58 @@ def compile_crosscheck_names(element: SaColumn, arg1, arg2 = list(element.clauses) return "coalesce(avals(%s) && ARRAY(SELECT * FROM json_array_elements_text(%s)), false)" % ( compiler.process(arg1, **kw), compiler.process(arg2, **kw)) + + +@compiles(CrosscheckNames, 'sqlite') # type: ignore[no-untyped-call, misc] +def compile_sqlite_crosscheck_names(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + arg1, arg2 = list(element.clauses) + return "EXISTS(SELECT *"\ + " FROM json_each(%s) as name, json_each(%s) as match_name"\ + " WHERE name.value = match_name.value)"\ + % (compiler.process(arg1, **kw), compiler.process(arg2, **kw)) + + +class JsonArrayEach(sa.sql.functions.GenericFunction[Any]): + """ Return elements of a json array as a set. + """ + name = 'JsonArrayEach' + inherit_cache = True + + +@compiles(JsonArrayEach) # type: ignore[no-untyped-call, misc] +def default_json_array_each(element: SaColumn, compiler: 'sa.Compiled', **kw: Any) -> str: + return "json_array_elements(%s)" % compiler.process(element.clauses, **kw) + + +@compiles(JsonArrayEach, 'sqlite') # type: ignore[no-untyped-call, misc] +def sqlite_json_array_each(element: SaColumn, compiler: 'sa.Compiled', **kw: Any) -> str: + return "json_each(%s)" % compiler.process(element.clauses, **kw) + + +class JsonHasKey(sa.sql.functions.GenericFunction[bool]): + """ Return elements of a json array as a set. + """ + type = sa.Boolean() + name = 'JsonHasKey' + inherit_cache = True + + +@compiles(JsonHasKey) # type: ignore[no-untyped-call, misc] +def compile_json_has_key(element: SaColumn, + compiler: 'sa.Compiled', **kw: Any) -> str: + arg1, arg2 = list(element.clauses) + return "%s->%s is not null" % (compiler.process(arg1, **kw), + compiler.process(arg2, **kw)) + + +class Greatest(sa.sql.functions.GenericFunction[Any]): + """ Function to compute maximum of all its input parameters. + """ + name = 'greatest' + inherit_cache = True + + +@compiles(Greatest, 'sqlite') # type: ignore[no-untyped-call, misc] +def sqlite_greatest(element: SaColumn, compiler: 'sa.Compiled', **kw: Any) -> str: + return "max(%s)" % compiler.process(element.clauses, **kw)