#!/usr/bin/env python3 import json import os import re import unittest import shutil import tempfile import xml.etree.ElementTree as ET import string import requests from parameterized import parameterized_class from openpilot.selfdrive.ui.update_translations import TRANSLATIONS_DIR, LANGUAGES_FILE, update_translations with open(LANGUAGES_FILE) as f: translation_files = json.load(f) UNFINISHED_TRANSLATION_TAG = "" not in cur_translations, f"{self.file} ({self.name}) translation file has obsolete translations. Run selfdrive/ui/update_translations.py --vanish to remove them") def test_finished_translations(self): """ Tests ran on each translation marked "finished" Plural: - that any numerus (plural) translations have all plural forms non-empty - that the correct format specifier is used (%n) Non-plural: - that translation is not empty - that translation format arguments are consistent """ tr_xml = ET.parse(os.path.join(TRANSLATIONS_DIR, f"{self.file}.ts")) for context in tr_xml.getroot(): for message in context.iterfind("message"): translation = message.find("translation") source_text = message.find("source").text # Do not test unfinished translations if translation.get("type") == "unfinished": continue if message.get("numerus") == "yes": numerusform = [t.text for t in translation.findall("numerusform")] for nf in numerusform: self.assertIsNotNone(nf, f"Ensure all plural translation forms are completed: {source_text}") self.assertIn("%n", nf, "Ensure numerus argument (%n) exists in translation.") self.assertIsNone(FORMAT_ARG.search(nf), f"Plural translations must use %n, not %1, %2, etc.: {numerusform}") else: self.assertIsNotNone(translation.text, f"Ensure translation is completed: {source_text}") source_args = FORMAT_ARG.findall(source_text) translation_args = FORMAT_ARG.findall(translation.text) self.assertEqual(sorted(source_args), sorted(translation_args), f"Ensure format arguments are consistent: `{source_text}` vs. `{translation.text}`") def test_no_locations(self): for line in self._read_translation_file(TRANSLATIONS_DIR, self.file).splitlines(): self.assertFalse(line.strip().startswith(LOCATION_TAG), f"Line contains location tag: {line.strip()}, remove all line numbers.") def test_entities_error(self): cur_translations = self._read_translation_file(TRANSLATIONS_DIR, self.file) matches = re.findall(r'@(\w+);', cur_translations) self.assertEqual(len(matches), 0, f"The string(s) {matches} were found with '@' instead of '&'") def test_bad_language(self): IGNORED_WORDS = {'pédale'} match = re.search(r'_([a-zA-Z]{2,3})', self.file) assert match, f"{self.name} - could not parse language" response = requests.get(f"https://raw.githubusercontent.com/LDNOOBW/List-of-Dirty-Naughty-Obscene-and-Otherwise-Bad-Words/master/{match.group(1)}") response.raise_for_status() banned_words = {line.strip() for line in response.text.splitlines()} for context in ET.parse(os.path.join(TRANSLATIONS_DIR, f"{self.file}.ts")).getroot(): for message in context.iterfind("message"): translation = message.find("translation") if translation.get("type") == "unfinished": continue translation_text = " ".join([t.text for t in translation.findall("numerusform")]) if message.get("numerus") == "yes" else translation.text if not translation_text: continue words = set(translation_text.translate(str.maketrans('', '', string.punctuation + '%n')).lower().split()) bad_words_found = words & (banned_words - IGNORED_WORDS) assert not bad_words_found, f"Bad language found in {self.name}: '{translation_text}'. Bad word(s): {', '.join(bad_words_found)}" if __name__ == "__main__": unittest.main()