From: Sarah Hoffmann Date: Fri, 10 Jan 2025 19:58:34 +0000 (+0100) Subject: Merge remote-tracking branch 'upstream/master' X-Git-Url: https://git.openstreetmap.org./nominatim.git/commitdiff_plain/7f87cd1806e6e51ba9ff0613d00f622140dd248e?hp=--cc Merge remote-tracking branch 'upstream/master' --- 7f87cd1806e6e51ba9ff0613d00f622140dd248e diff --cc src/nominatim_api/search/icu_tokenizer.py index ac78d03c,6f1dcf79..8f2069c1 --- a/src/nominatim_api/search/icu_tokenizer.py +++ b/src/nominatim_api/search/icu_tokenizer.py @@@ -164,14 -206,10 +206,16 @@@ class ICUQueryAnalyzer(AbstractQueryAna tokenized query. """ log().section('Analyze query (using ICU tokenizer)') - normalized = list(filter(lambda p: p.text, - (qmod.Phrase(p.ptype, self.normalize_text(p.text)) - for p in phrases))) - if len(normalized) == 1 \ - and normalized[0].text.count(' ') > 3 \ - and max(len(s) for s in normalized[0].text.split()) < 3: + for func in self.preprocessors: + phrases = func(phrases) ++ ++ if len(phrases) == 1 \ ++ and phrases[0].text.count(' ') > 3 \ ++ and max(len(s) for s in phrases[0].text.split()) < 3: + normalized = [] - query = qmod.QueryStruct(normalized) ++ + query = qmod.QueryStruct(phrases) + log().var_dump('Normalized query', query.source) if not query.source: return query