X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/bd2c64876f7ddc99da14ea78a652f797e17134f4..c221e1fd56be892ca13b5a87e248d47d47996cd2:/test/python/api/search/test_db_search_builder.py diff --git a/test/python/api/search/test_db_search_builder.py b/test/python/api/search/test_db_search_builder.py index 9631850e..0e5a8bfc 100644 --- a/test/python/api/search/test_db_search_builder.py +++ b/test/python/api/search/test_db_search_builder.py @@ -332,9 +332,10 @@ def test_name_only_search_with_countries(): assert not search.housenumbers.values -def make_counted_searches(name_part, name_full, address_part, address_full): +def make_counted_searches(name_part, name_full, address_part, address_full, + num_address_parts=1): q = QueryStruct([Phrase(PhraseType.NONE, '')]) - for i in range(2): + for i in range(1 + num_address_parts): q.add_node(BreakType.WORD, PhraseType.NONE) q.add_node(BreakType.END, PhraseType.NONE) @@ -342,15 +343,16 @@ def make_counted_searches(name_part, name_full, address_part, address_full): MyToken(0.5, 1, name_part, 'name_part', True)) q.add_token(TokenRange(0, 1), TokenType.WORD, MyToken(0, 101, name_full, 'name_full', True)) - q.add_token(TokenRange(1, 2), TokenType.PARTIAL, - MyToken(0.5, 2, address_part, 'address_part', True)) - q.add_token(TokenRange(1, 2), TokenType.WORD, - MyToken(0, 102, address_full, 'address_full', True)) + for i in range(num_address_parts): + q.add_token(TokenRange(i + 1, i + 2), TokenType.PARTIAL, + MyToken(0.5, 2, address_part, 'address_part', True)) + q.add_token(TokenRange(i + 1, i + 2), TokenType.WORD, + MyToken(0, 102, address_full, 'address_full', True)) builder = SearchBuilder(q, SearchDetails()) return list(builder.build(TokenAssignment(name=TokenRange(0, 1), - address=[TokenRange(1, 2)]))) + address=[TokenRange(1, 1 + num_address_parts)]))) def test_infrequent_partials_in_name(): @@ -368,7 +370,7 @@ def test_infrequent_partials_in_name(): def test_frequent_partials_in_name_but_not_in_address(): - searches = make_counted_searches(10000, 1, 1, 1) + searches = make_counted_searches(10000, 1, 1, 1, num_address_parts=4) assert len(searches) == 1 search = searches[0] @@ -382,7 +384,7 @@ def test_frequent_partials_in_name_but_not_in_address(): def test_frequent_partials_in_name_and_address(): - searches = make_counted_searches(10000, 1, 10000, 1) + searches = make_counted_searches(9999, 1, 9999, 1) assert len(searches) == 2 @@ -393,3 +395,15 @@ def test_frequent_partials_in_name_and_address(): {('name_vector', 'lookup_any'), ('nameaddress_vector', 'restrict')} assert set((l.column, l.lookup_type) for l in searches[1].lookups) == \ {('nameaddress_vector', 'lookup_all'), ('name_vector', 'lookup_all')} + + +def test_too_frequent_partials_in_name_and_address(): + searches = make_counted_searches(10000, 1, 10000, 1) + + assert len(searches) == 1 + + assert all(isinstance(s, dbs.PlaceSearch) for s in searches) + searches.sort(key=lambda s: s.penalty) + + assert set((l.column, l.lookup_type) for l in searches[0].lookups) == \ + {('name_vector', 'lookup_any'), ('nameaddress_vector', 'restrict')}