Add Japanese sanitizer

This commit is contained in:
miku0
2023-07-26 07:54:58 +00:00
parent 261e0cfd5a
commit 0722495434
5 changed files with 253 additions and 0 deletions

View File

@@ -45,6 +45,7 @@ sanitizers:
whitelist: [bg,ca,cs,da,de,el,en,es,et,eu,fi,fr,gl,hu,it,ja,mg,ms,nl,no,pl,pt,ro,ru,sk,sl,sv,tr,uk,vi]
use-defaults: all
mode: append
- step: tag-japanese
token-analysis:
- analyzer: generic
- id: "@housenumber"