Path: blob/development/scripts/manage_languages.py
3153 views
# Written for Python 3.6+1# Older versions don't retain insertion order of regular dicts2import argparse3import cmd4import json5import os6import re7from pprint import pprint89INDENT = 210PRIMARY_LANGUAGE = 'en-US.json'11PRIMARY_FALLBACK_PREFIX = '🇺🇸' # This is invisible in-game, terminal emulators might render it12LANGUAGE_FOLDER = 'src/main/resources/languages/'13LANGUAGE_FILENAMES = sorted(os.listdir(LANGUAGE_FOLDER), key=lambda x: 'AAA' if x == PRIMARY_LANGUAGE else x)14SOURCE_FOLDER = 'src/'15SOURCE_EXTENSIONS = ('java')161718def ppprint(data):19pprint(data, width=130, sort_dicts=False, compact=True)202122class JsonHelpers:23@staticmethod24def load(filename: str) -> dict:25with open(filename, 'r', encoding='utf-8') as file:26return json.load(file)2728@staticmethod29def save(filename: str, data: dict) -> None:30with open(filename, 'w', encoding='utf-8', newline='\n') as file:31json.dump(data, file, ensure_ascii=False, indent=INDENT)32file.write('\n') # json.dump doesn't terminate last line3334@staticmethod35def flatten(data: dict, prefix='') -> dict:36output = {}37for key, value in data.items():38if isinstance(value, dict):39for k,v in JsonHelpers.flatten(value, f'{prefix}{key}.').items():40output[k] = v41else:42output[f'{prefix}{key}'] = value43return output4445@staticmethod46def unflatten(data: dict) -> dict:47output = {}48def add_key(k: list, value, d: dict):49if len(k) == 1:50d[k[0]] = value51else:52d[k[0]] = d.get(k[0], {})53add_key(k[1:], value, d[k[0]])54for key, value in data.items():55add_key(key.split('.'), value, output)56return output5758@staticmethod59def pprint_keys(keys, indent=4) -> str:60# Only strip down to one level61padding = ' ' * indent62roots = {}63for key in keys:64root, _, k = key.rpartition('.')65roots[root] = roots.get(root, [])66roots[root].append(k)67lines = []68for root, ks in roots.items():69if len(ks) > 1:70lines.append(f'{padding}{root}.[{", ".join(ks)}]')71else:72lines.append(f'{padding}{root}.{ks[0]}')73return ',\n'.join(lines)7475@staticmethod76def deep_clone_and_fill(d1: dict, d2: dict, fallback_prefix=PRIMARY_FALLBACK_PREFIX) -> dict:77out = {}78for key, value in d1.items():79if isinstance(value, dict):80out[key] = JsonHelpers.deep_clone_and_fill(value, d2.get(key, {}), fallback_prefix)81else:82v2 = d2.get(key, value)83if type(value) == str and v2 == value:84out[key] = fallback_prefix + value85else:86out[key] = v287return out888990class LanguageManager:91TRANSLATION_KEY = re.compile(r'[Tt]ranslate.*"(\w+\.[\w\.]+)"')92POTENTIAL_KEY = re.compile(r'"(\w+\.[\w\.]+)"')93COMMAND_LABEL = re.compile(r'@Command\s*\([\W\w]*?label\s*=\s*"(\w+)"', re.MULTILINE) # [\W\w] is a cheeky way to match everything including \n9495def __init__(self):96self.load_jsons()9798def load_jsons(self):99self.language_jsons = [JsonHelpers.load(LANGUAGE_FOLDER + filename) for filename in LANGUAGE_FILENAMES]100self.flattened_jsons = [JsonHelpers.flatten(j) for j in self.language_jsons]101self.update_keys()102103def update_keys(self):104self.key_sets = [set(j.keys()) for j in self.flattened_jsons]105self.common_keys = set.intersection(*self.key_sets)106self.all_keys = set.union(*self.key_sets)107self.used_keys = self.find_all_used_keys(self.all_keys)108self.missing_keys = self.used_keys - self.common_keys109self.unused_keys = self.all_keys - self.used_keys110111def find_all_used_keys(self, expected_keys=[]) -> set:112# Note that this will only find string literals passed to the translate() or sendTranslatedMessage() methods!113# String variables passed to them can be checked against expected_keys114used = set()115potential = set()116for root, dirs, files in os.walk(SOURCE_FOLDER):117for file in files:118if file.rpartition('.')[-1] in SOURCE_EXTENSIONS:119filename = os.path.join(root, file)120with open(filename, 'r', encoding='utf-8') as f:121data = f.read() # Loads in entire file at once122for k in self.TRANSLATION_KEY.findall(data):123used.add(k)124for k in self.POTENTIAL_KEY.findall(data):125potential.add(k)126for label in self.COMMAND_LABEL.findall(data):127used.add(f'commands.{label}.description')128return used | (potential & expected_keys)129130def _lint_report_language(self, lang: str, keys: set, flattened: dict, primary_language_flattened: dict) -> None:131missing = self.used_keys - keys132unused = keys - self.used_keys133identical_keys = set() if (lang == PRIMARY_LANGUAGE) else {key for key in keys if primary_language_flattened.get(key, None) == flattened.get(key)}134placeholder_keys = {key for key in keys if flattened.get(key).startswith(PRIMARY_FALLBACK_PREFIX)}135p1 = f'Language {lang} has {len(missing)} missing keys and {len(unused)} unused keys.'136p2 = 'This is the primary language.' if (lang == PRIMARY_LANGUAGE) else f'{len(identical_keys)} match {PRIMARY_LANGUAGE}, {len(placeholder_keys)} have the placeholder mark.'137print(f'{p1} {p2}')138139lint_categories = {140'Missing': missing,141'Unused': unused,142f'Matches {PRIMARY_LANGUAGE}': identical_keys,143'Placeholder': placeholder_keys,144}145for name, category in lint_categories.items():146if len(category) > 0:147print(name + ':')148print(JsonHelpers.pprint_keys(sorted(category)))149150def lint_report(self) -> None:151print(f'There are {len(self.missing_keys)} translation keys in use that are missing from one or more language files.')152print(f'There are {len(self.unused_keys)} translation keys in language files that are not used.')153primary_language_flattened = self.flattened_jsons[LANGUAGE_FILENAMES.index(PRIMARY_LANGUAGE)]154for lang, keys, flattened in zip(LANGUAGE_FILENAMES, self.key_sets, self.flattened_jsons):155print('')156self._lint_report_language(lang, keys, flattened, primary_language_flattened)157158def rename_keys(self, key_remappings: dict) -> None:159# Unfortunately we can't rename keys in-place preserving insertion order, so we have to make new dicts160for i in range(len(self.flattened_jsons)):161self.flattened_jsons[i] = {key_remappings.get(k,k):v for k,v in self.flattened_jsons[i].items()}162163def update_secondary_languages(self):164# Push en_US fallback165primary_language_json = self.language_jsons[LANGUAGE_FILENAMES.index(PRIMARY_LANGUAGE)]166for filename, lang in zip(LANGUAGE_FILENAMES, self.language_jsons):167if filename != PRIMARY_LANGUAGE:168js = JsonHelpers.deep_clone_and_fill(primary_language_json, lang)169JsonHelpers.save(LANGUAGE_FOLDER + filename, js)170171def update_all_languages_from_flattened(self):172for filename, flat in zip(LANGUAGE_FILENAMES, self.flattened_jsons):173JsonHelpers.save(LANGUAGE_FOLDER + filename, JsonHelpers.unflatten(flat))174175def save_flattened_languages(self, prefix='flat_'):176for filename, flat in zip(LANGUAGE_FILENAMES, self.flattened_jsons):177JsonHelpers.save(prefix + filename, flat)178179180class InteractiveRename(cmd.Cmd):181intro = 'Welcome to the interactive rename shell. Type help or ? to list commands.\n'182prompt = '(rename) '183file = None184185def __init__(self, language_manager: LanguageManager) -> None:186super().__init__()187self.language_manager = language_manager188self.flat_keys = [key for key in language_manager.flattened_jsons[LANGUAGE_FILENAMES.index(PRIMARY_LANGUAGE)].keys()]189self.mappings = {}190191def do_add(self, arg):192'''193Prepare to rename an existing translation key. Will not actually rename anything until you confirm all your pending changes with 'rename'.194e.g. a single string: add commands.execution.argument_error commands.generic.invalid.argument195e.g. a group: add commands.enter_dungeon commands.new_enter_dungeon196'''197args = arg.split()198if len(args) < 2:199self.do_help('add')200return201old, new = args[:2]202if old in self.flat_keys:203self.mappings[old] = new204else:205# Check if we are renaming a higher level206if not old.endswith('.'):207old = old + '.'208results = [key for key in self.flat_keys if key.startswith(old)]209if len(results) > 0:210if not new.endswith('.'):211new = new + '.'212new_mappings = {key: key.replace(old, new) for key in results}213# Ask for confirmation214print('Will add the following mappings:')215ppprint(new_mappings)216print('Add these mappings? [y/N]')217if self.prompt_yn():218for k,v in new_mappings.items():219self.mappings[k] = v220else:221print('No translation keys matched!')222223def complete_add(self, text: str, line: str, begidx: int, endidx: int) -> list:224if text == '':225return [k for k in {key.partition('.')[0] for key in self.flat_keys}]226results = [key for key in self.flat_keys if key.startswith(text)]227if len(results) > 40:228# Collapse categories229if text[-1] != '.':230text = text + '.'231level = text.count('.') + 1232new_results = {'.'.join(key.split('.')[:level]) for key in results}233return list(new_results)234return results235236def do_remove(self, arg):237'''238Remove a pending rename mapping. Takes the old name of the key, not the new one.239e.g. a single key: remove commands.execution.argument_error240e.g. a group: remove commands.enter_dungeon241'''242old = arg.split()[0]243if old in self.mappings:244self.mappings.pop(old)245else:246# Check if we are renaming a higher level247if not old.endswith('.'):248old = old + '.'249results = [key for key in self.mappings if key.startswith(old)]250if len(results) > 0:251# Ask for confirmation252print('Will remove the following pending mappings:')253print(JsonHelpers.pprint_keys(results))254print('Delete these mappings? [y/N]')255if self.prompt_yn():256for key in results:257self.mappings.pop(key)258else:259print('No pending rename mappings matched!')260261def complete_remove(self, text: str, line: str, begidx: int, endidx: int) -> list:262return [key for key in self.mappings if key.startswith(text)]263264def do_rename(self, _arg):265'Applies pending renames and overwrites language jsons.'266# Ask for confirmation267print('Will perform the following mappings:')268ppprint(self.mappings)269print('Perform and save these rename mappings? [y/N]')270if self.prompt_yn():271self.language_manager.rename_keys(self.mappings)272self.language_manager.update_all_languages_from_flattened()273print('Renamed keys, closing')274return True275else:276print('Do you instead wish to quit without saving? [yes/N]')277if self.prompt_yn(True):278print('Left rename shell without renaming')279return True280281def prompt_yn(self, strict_yes=False):282if strict_yes:283return input('(yes/N) ').lower() == 'yes'284return input('(y/N) ').lower()[0] == 'y'285286287def main(args: argparse.Namespace):288# print(args)289language_manager = LanguageManager()290errors = None291if args.lint_report:292language_manager.lint_report()293missing = language_manager.used_keys - language_manager.key_sets[LANGUAGE_FILENAMES.index(PRIMARY_LANGUAGE)]294if len(missing) > 0:295errors = f'[ERROR] {len(missing)} keys missing from primary language json!\n{JsonHelpers.pprint_keys(missing)}'296if prefix := args.save_flattened:297language_manager.save_flattened_languages(prefix)298if args.update:299print('Updating secondary languages')300language_manager.update_secondary_languages()301if args.interactive_rename:302language_manager.load_jsons() # Previous actions may have changed them on-disk303try:304InteractiveRename(language_manager).cmdloop()305except KeyboardInterrupt:306print('Left rename shell without renaming')307if errors:308print(errors)309exit(1)310311312313if __name__ == "__main__":314parser = argparse.ArgumentParser(description="Manage Grasscutter's language json files.")315parser.add_argument('-u', '--update', action='store_true',316help=f'Update secondary language files to conform to the layout of the primary language file ({PRIMARY_LANGUAGE}) and contain any new keys from it.')317parser.add_argument('-l', '--lint-report', action='store_true',318help='Prints a lint report, listing unused, missing, and untranslated keys among all language jsons.')319parser.add_argument('-f', '--save-flattened', const='./flat_', metavar='prefix', nargs='?',320help='Save copies of all the language jsons in a flattened key form.')321parser.add_argument('-i', '--interactive-rename', action='store_true',322help='Enter interactive rename mode, in which you can specify keys in flattened form to be renamed.')323args = parser.parse_args()324main(args)325326