From df8c7bb50c01a5bf61aeb840cdf9b80b060b90e9 Mon Sep 17 00:00:00 2001 From: towzeur Date: Mon, 21 Aug 2023 10:28:41 +0200 Subject: [PATCH] add scan_i18n to detect unused and missing keys (#1058) --- scan_i18n.py | 68 ++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 68 insertions(+) create mode 100644 scan_i18n.py diff --git a/scan_i18n.py b/scan_i18n.py new file mode 100644 index 0000000..1f9247d --- /dev/null +++ b/scan_i18n.py @@ -0,0 +1,68 @@ +import ast +import glob +import json + +from collections import OrderedDict + +def extract_i18n_strings(node): + i18n_strings = [] + + if isinstance(node, ast.Call) and isinstance(node.func, ast.Name) and node.func.id == "i18n": + for arg in node.args: + if isinstance(arg, ast.Str): + i18n_strings.append(arg.s) + + for child_node in ast.iter_child_nodes(node): + i18n_strings.extend(extract_i18n_strings(child_node)) + + return i18n_strings + +# scan the directory for all .py files (recursively) +# for each file, parse the code into an AST +# for each AST, extract the i18n strings + +strings = [] +for filename in glob.iglob('**/*.py', recursive=True): + with open(filename, 'r') as f: + code = f.read() + if "I18nAuto" in code: + tree = ast.parse(code) + i18n_strings = extract_i18n_strings(tree) + print(filename, len(i18n_strings)) + strings.extend(i18n_strings) +code_keys = set(strings) +''' +n_i18n.py +gui_v1.py 26 +app.py 16 +infer-web.py 147 +scan_i18n.py 0 +i18n.py 0 +lib/train/process_ckpt.py 1 +''' +print() +print('Total unique:', len(code_keys)) + + + +standard_file = "zh_CN.json" +with open(f"lib/i18n/{standard_file}", "r", encoding="utf-8") as f: + standard_data = json.load(f, object_pairs_hook=OrderedDict) +standard_keys = set(standard_data.keys()) + +# Define the standard file name +unused_keys = standard_keys - code_keys +print('Unused keys:', len(unused_keys)) +for unused_key in unused_keys: + print('\t', unused_key) + +missing_keys = code_keys - standard_keys +print('Missing keys:', len(missing_keys)) +for missing_key in missing_keys: + print('\t', missing_key) + + + + + +