From b7d4ff3201376126d9b4979fffe6b4521469d861 Mon Sep 17 00:00:00 2001 From: Sarah Hoffmann Date: Tue, 31 Aug 2021 11:18:34 +0200 Subject: [PATCH] icu: normalise simplified to traditional Chinese The conversion is unambiguous in most cases, so that the information loss is minimal. --- settings/icu_tokenizer.yaml | 1 + 1 file changed, 1 insertion(+) diff --git a/settings/icu_tokenizer.yaml b/settings/icu_tokenizer.yaml index 5fd30bd8..c0c8c043 100644 --- a/settings/icu_tokenizer.yaml +++ b/settings/icu_tokenizer.yaml @@ -1,5 +1,6 @@ normalization: - ":: lower ()" + - ":: Hans-Hant" - !include icu-rules/unicode-digits-to-decimal.yaml - "'№' > 'no'" - "'n°' > 'no'"