factor out housenumber splitting into sanitizer

This commit is contained in:
Sarah Hoffmann
2022-01-07 22:41:09 +01:00
parent a7e048484b
commit 206ee87188
4 changed files with 118 additions and 23 deletions

View File

@@ -27,6 +27,7 @@ transliteration:
# Sanitizer steps; each list entry selects one step through its `step` key.
sanitizers:
- step: split-name-list
- step: strip-brace-terms
# Housenumber handling configured as a sanitizer step of its own.
- step: clean-housenumbers
- step: tag-analyzer-by-language
  # The two keys below are options of the tag-analyzer-by-language entry.
  # They must stay nested under it: at column 0 they would parse as
  # unrelated top-level keys instead of step parameters.
  filter-kind: [".*name.*"]
  # Presumably language codes (verify against the sanitizer's docs).
  # "no" is quoted on purpose: YAML 1.1 loaders read a bare `no` as the
  # boolean false, which would silently drop that entry from the list.
  whitelist: [bg, ca, cs, da, de, el, en, es, et, eu, fi, fr, gl, hu, it,
              ja, mg, ms, nl, "no", pl, pt, ro, ru, sk, sl, sv, tr, uk, vi]