Add the ICU transform ":: Hans-Hant" to the normalization rules of
settings/icu_tokenizer.yaml. The new rule is inserted directly after
":: lower ()" and before the unicode-digits-to-decimal include.

NOTE(review): "Hans-Hant" is presumably the ICU Simplified-to-Traditional
Han script transform; confirm against the ICU transform ID list.
NOTE(review): the indentation of the YAML list items is assumed to be four
spaces; confirm against the target file before applying.

diff --git a/settings/icu_tokenizer.yaml b/settings/icu_tokenizer.yaml
index 5fd30bd8..c0c8c043 100644
--- a/settings/icu_tokenizer.yaml
+++ b/settings/icu_tokenizer.yaml
@@ -1,5 +1,6 @@
 normalization:
     - ":: lower ()"
+    - ":: Hans-Hant"
     - !include icu-rules/unicode-digits-to-decimal.yaml
     - "'№' > 'no'"
     - "'n°' > 'no'"