2023-03-02 14:45:55 +03:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
|
|
|
# Copyright (C) 2023 Yubico.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
|
|
|
|
|
|
|
import json
|
2023-11-02 17:24:18 +03:00
|
|
|
import os
|
|
|
|
import sys
|
2023-03-02 14:45:55 +03:00
|
|
|
|
2024-04-11 15:48:24 +03:00
|
|
|
non_words = (":",)
|
2023-03-02 14:45:55 +03:00
|
|
|
errors = []
|
|
|
|
|
|
|
|
|
|
|
|
def check_duplicate_keys(pairs):
|
|
|
|
seen = set()
|
|
|
|
for d in [k for k, v in pairs if k in seen or seen.add(k)]:
|
|
|
|
errors.append(f"Duplicate key: {d}")
|
|
|
|
return dict(pairs)
|
|
|
|
|
|
|
|
|
|
|
|
def check_duplicate_values(strings):
|
|
|
|
seen = {}
|
|
|
|
for k, v in strings.items():
|
|
|
|
if isinstance(v, str):
|
|
|
|
if v in seen:
|
|
|
|
errors.append(
|
|
|
|
f"Duplicate value in key: {k} (originally in {seen[v]}): {v}"
|
|
|
|
)
|
|
|
|
else:
|
|
|
|
seen[v] = k
|
|
|
|
|
|
|
|
|
2023-11-02 18:13:08 +03:00
|
|
|
def check_prefixes(k, v, s_max_words, s_max_len, p_ending_chars, q_ending_chars):
|
2023-03-02 14:45:55 +03:00
|
|
|
errs = []
|
|
|
|
if k.startswith("s_"):
|
|
|
|
if len(v) > s_max_len:
|
|
|
|
errs.append(f"Too long ({len(v)} chars)")
|
2024-04-11 15:48:24 +03:00
|
|
|
n_words = len([w for w in v.split() if w not in non_words])
|
|
|
|
if n_words > s_max_words:
|
|
|
|
errs.append(f"Too many words ({n_words})")
|
2023-03-02 16:20:47 +03:00
|
|
|
if k.startswith("l_") or k.startswith("s_"):
|
2023-03-02 14:45:55 +03:00
|
|
|
if v.endswith("."):
|
|
|
|
errs.append("Ends with '.'")
|
|
|
|
if ". " in v:
|
|
|
|
errs.append("Spans multiple sentences")
|
|
|
|
elif k.startswith("p_"):
|
2023-11-02 18:13:08 +03:00
|
|
|
if p_ending_chars and not any(v.endswith(p) for p in p_ending_chars):
|
2023-03-02 14:45:55 +03:00
|
|
|
errs.append("Doesn't end in punctuation")
|
|
|
|
elif k.startswith("q_"):
|
2023-11-02 18:13:08 +03:00
|
|
|
if q_ending_chars and not any(v.endswith(q) for q in q_ending_chars):
|
2023-11-02 17:20:31 +03:00
|
|
|
errs.append("Doesn't end in question mark.")
|
2023-03-02 14:45:55 +03:00
|
|
|
return errs
|
|
|
|
|
|
|
|
|
|
|
|
def check_misc(k, v):
|
|
|
|
errs = []
|
|
|
|
if "..." in v:
|
|
|
|
errs.append("'...' should be replaced with '\\u2026'")
|
2024-09-06 09:52:35 +03:00
|
|
|
if v[0].upper() != v[0]:
|
2023-03-02 16:20:47 +03:00
|
|
|
errs.append("Starts with lowercase letter")
|
2023-03-02 14:45:55 +03:00
|
|
|
return errs
|
|
|
|
|
|
|
|
|
2023-11-02 17:24:18 +03:00
|
|
|
def check_keys_exist_in_reference(reference_strings, checked_strings):
|
|
|
|
errs = []
|
|
|
|
for key in checked_strings.keys():
|
|
|
|
if key not in reference_strings:
|
|
|
|
errs.append(f"Invalid key: {key}")
|
|
|
|
return errs
|
|
|
|
|
|
|
|
|
2023-03-02 14:45:55 +03:00
|
|
|
def lint_strings(strings, rules):
|
|
|
|
for k, v in strings.items():
|
2023-11-02 16:56:17 +03:00
|
|
|
if v is None:
|
|
|
|
continue
|
2023-03-02 14:45:55 +03:00
|
|
|
errs = []
|
|
|
|
errs.extend(
|
|
|
|
check_prefixes(
|
|
|
|
k,
|
|
|
|
v,
|
|
|
|
rules.get("s_max_words", 4),
|
2024-04-11 15:48:24 +03:00
|
|
|
rules.get("s_max_length", 32),
|
2023-11-02 18:13:08 +03:00
|
|
|
rules.get("p_ending_chars", ".!"),
|
|
|
|
rules.get("q_ending_chars", "?"),
|
2023-03-02 14:45:55 +03:00
|
|
|
)
|
|
|
|
)
|
|
|
|
errs.extend(check_misc(k, v))
|
|
|
|
if errs:
|
|
|
|
errors.append(f'Errors in {k}: "{v}"')
|
|
|
|
errors.extend([f" {e}" for e in errs])
|
|
|
|
|
|
|
|
|
|
|
|
if len(sys.argv) != 2:
|
|
|
|
print("USAGE: check_strings.py <ARB_FILE>")
|
|
|
|
sys.exit(1)
|
|
|
|
|
|
|
|
|
|
|
|
target = sys.argv[1]
|
2023-11-30 17:15:59 +03:00
|
|
|
with open(target, encoding="utf-8") as f:
|
2023-03-02 14:45:55 +03:00
|
|
|
values = json.load(f, object_pairs_hook=check_duplicate_keys)
|
|
|
|
|
|
|
|
strings = {k: v for k, v in values.items() if not k.startswith("@")}
|
|
|
|
|
2023-03-02 16:20:47 +03:00
|
|
|
print(target, f"- checking {len(strings)} strings")
|
2023-11-02 16:59:44 +03:00
|
|
|
lint_strings(strings, values.get("@_lint_rules", {}))
|
2023-03-02 16:20:47 +03:00
|
|
|
check_duplicate_values(strings)
|
2023-03-02 14:45:55 +03:00
|
|
|
|
2023-11-30 17:15:59 +03:00
|
|
|
with open(os.path.join(os.path.dirname(target), "app_en.arb"), encoding="utf-8") as f:
|
2023-11-02 17:24:18 +03:00
|
|
|
reference_values = json.load(f)
|
|
|
|
errors.extend(check_keys_exist_in_reference(reference_values, values))
|
|
|
|
|
|
|
|
|
2023-03-02 14:45:55 +03:00
|
|
|
if errors:
|
2023-03-02 16:20:47 +03:00
|
|
|
print()
|
|
|
|
print(target, "HAS ERRORS:")
|
2023-03-02 14:45:55 +03:00
|
|
|
for e in errors:
|
|
|
|
print(e)
|
2023-03-02 16:20:47 +03:00
|
|
|
print()
|
2023-03-02 14:45:55 +03:00
|
|
|
sys.exit(1)
|
|
|
|
|
2023-03-02 16:20:47 +03:00
|
|
|
print(target, "OK")
|