X-Git-Url: https://git.openstreetmap.org./nominatim.git/blobdiff_plain/fb54bd3fcff5a8a44ae59f0d552ed316b08966b3..3741afa6dc5eced78483b2c2793a8eead0a2396e:/settings/icu_tokenizer.yaml diff --git a/settings/icu_tokenizer.yaml b/settings/icu_tokenizer.yaml index a3c62e67..d00cffb9 100644 --- a/settings/icu_tokenizer.yaml +++ b/settings/icu_tokenizer.yaml @@ -27,6 +27,7 @@ transliteration: sanitizers: - step: split-name-list - step: strip-brace-terms + - step: clean-housenumbers - step: tag-analyzer-by-language filter-kind: [".*name.*"] whitelist: [bg,ca,cs,da,de,el,en,es,et,eu,fi,fr,gl,hu,it,ja,mg,ms,nl,no,pl,pt,ro,ru,sk,sl,sv,tr,uk,vi] @@ -59,6 +60,13 @@ token-analysis: mode: variant-only variants: - !include icu-rules/variants-de.yaml + mutations: + - pattern: ä + replacements: ["ä", "ae"] + - pattern: ö + replacements: ["ö", "oe"] + - pattern: ü + replacements: ["ü", "ue"] - id: el analyzer: generic mode: variant-only