From: Sarah Hoffmann Date: Mon, 31 Mar 2025 09:06:21 +0000 (+0200) Subject: more aggressively reduce expected count for multi-word terms X-Git-Url: https://git.openstreetmap.org./nominatim.git/commitdiff_plain/51847ebfeb204c9fe7e133617304fb702698ae12 more aggressively reduce expected count for multi-word terms Improves searching of non-latin scripts with forced token spaces. --- diff --git a/src/nominatim_api/search/db_search_builder.py b/src/nominatim_api/search/db_search_builder.py index ddfddaa6..fdf9e2f8 100644 --- a/src/nominatim_api/search/db_search_builder.py +++ b/src/nominatim_api/search/db_search_builder.py @@ -208,7 +208,7 @@ class SearchBuilder: addr_partials = [t for r in address for t in self.query.get_partials_list(r)] addr_tokens = list({t.token for t in addr_partials}) - exp_count = min(t.count for t in name_partials.values()) / (2**(len(name_partials) - 1)) + exp_count = min(t.count for t in name_partials.values()) / (3**(len(name_partials) - 1)) if (len(name_partials) > 3 or exp_count < 8000): yield penalty, exp_count, dbf.lookup_by_names(list(name_partials.keys()), addr_tokens)