Files
ComfyUI-Lora-Manager/test_i18n.py

987 lines
40 KiB
Python

#!/usr/bin/env python3
"""
Test script to verify the updated i18n system works correctly.
This tests both JavaScript loading and Python server-side functionality.
"""
import os
import sys
import json
import re
import glob
from typing import Set, Dict, List, Tuple, Any
# Add the parent directory to the path so we can import the modules
sys.path.insert(0, os.path.dirname(os.path.dirname(__file__)))
def test_json_files_exist():
"""Test that all JSON locale files exist and are valid JSON."""
print("Testing JSON locale files...")
return test_json_structure_validation()
def test_locale_files_structural_consistency():
"""Test that all locale files have identical structure, line counts, and formatting."""
print("\nTesting locale files structural consistency...")
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
if not os.path.exists(locales_dir):
print("❌ Locales directory does not exist!")
return False
# Get all locale files
locale_files = []
for file in os.listdir(locales_dir):
if file.endswith('.json'):
locale_files.append(file)
if not locale_files:
print("❌ No locale files found!")
return False
# Use en.json as the reference
reference_file = 'en.json'
if reference_file not in locale_files:
print(f"❌ Reference file {reference_file} not found!")
return False
locale_files.remove(reference_file)
locale_files.insert(0, reference_file) # Put reference first
success = True
# Load and parse the reference file
reference_path = os.path.join(locales_dir, reference_file)
try:
with open(reference_path, 'r', encoding='utf-8') as f:
reference_lines = f.readlines()
reference_content = ''.join(reference_lines)
reference_data = json.loads(reference_content)
reference_structure = get_json_structure(reference_data)
print(f"📋 Reference file {reference_file}:")
print(f" Lines: {len(reference_lines)}")
print(f" Keys: {len(get_all_translation_keys(reference_data))}")
except Exception as e:
print(f"❌ Error reading reference file {reference_file}: {e}")
return False
# Compare each locale file with the reference
for locale_file in locale_files[1:]: # Skip reference file
locale_path = os.path.join(locales_dir, locale_file)
locale_name = locale_file.replace('.json', '')
try:
with open(locale_path, 'r', encoding='utf-8') as f:
locale_lines = f.readlines()
locale_content = ''.join(locale_lines)
locale_data = json.loads(locale_content)
locale_structure = get_json_structure(locale_data)
# Test 1: Line count consistency
if len(locale_lines) != len(reference_lines):
print(f"{locale_name}: Line count mismatch!")
print(f" Reference: {len(reference_lines)} lines")
print(f" {locale_name}: {len(locale_lines)} lines")
success = False
continue
# Test 2: Structural consistency (key order and nesting)
structure_issues = compare_json_structures(reference_structure, locale_structure)
if structure_issues:
print(f"{locale_name}: Structure mismatch!")
for issue in structure_issues[:5]: # Show first 5 issues
print(f" - {issue}")
if len(structure_issues) > 5:
print(f" ... and {len(structure_issues) - 5} more issues")
success = False
continue
# Test 3: Line-by-line format consistency (excluding translation values)
format_issues = compare_line_formats(reference_lines, locale_lines, locale_name)
if format_issues:
print(f"{locale_name}: Format mismatch!")
for issue in format_issues[:5]: # Show first 5 issues
print(f" - {issue}")
if len(format_issues) > 5:
print(f" ... and {len(format_issues) - 5} more issues")
success = False
continue
# Test 4: Key completeness
reference_keys = get_all_translation_keys(reference_data)
locale_keys = get_all_translation_keys(locale_data)
missing_keys = reference_keys - locale_keys
extra_keys = locale_keys - reference_keys
if missing_keys or extra_keys:
print(f"{locale_name}: Key mismatch!")
if missing_keys:
print(f" Missing {len(missing_keys)} keys")
if extra_keys:
print(f" Extra {len(extra_keys)} keys")
success = False
continue
print(f"{locale_name}: Structure and format consistent")
except json.JSONDecodeError as e:
print(f"{locale_name}: Invalid JSON syntax: {e}")
success = False
except Exception as e:
print(f"{locale_name}: Error during validation: {e}")
success = False
if success:
print(f"\n✅ All {len(locale_files)} locale files have consistent structure and formatting")
return success
def get_json_structure(data: Any, path: str = '') -> Dict[str, Any]:
"""
Extract the structural information from JSON data.
Returns a dictionary describing the structure without the actual values.
"""
if isinstance(data, dict):
structure = {}
for key, value in data.items():
current_path = f"{path}.{key}" if path else key
if isinstance(value, dict):
structure[key] = get_json_structure(value, current_path)
elif isinstance(value, list):
structure[key] = {'_type': 'array', '_length': len(value)}
if value: # If array is not empty, analyze first element
structure[key]['_element_type'] = get_json_structure(value[0], f"{current_path}[0]")
else:
structure[key] = {'_type': type(value).__name__}
return structure
elif isinstance(data, list):
return {'_type': 'array', '_length': len(data)}
else:
return {'_type': type(data).__name__}
def compare_json_structures(ref_structure: Dict[str, Any], locale_structure: Dict[str, Any], path: str = '') -> List[str]:
"""
Compare two JSON structures and return a list of differences.
"""
issues = []
# Check for missing keys in locale
for key in ref_structure:
current_path = f"{path}.{key}" if path else key
if key not in locale_structure:
issues.append(f"Missing key: {current_path}")
elif isinstance(ref_structure[key], dict) and '_type' not in ref_structure[key]:
# It's a nested object, recurse
if isinstance(locale_structure[key], dict) and '_type' not in locale_structure[key]:
issues.extend(compare_json_structures(ref_structure[key], locale_structure[key], current_path))
else:
issues.append(f"Structure mismatch at {current_path}: expected object, got {type(locale_structure[key])}")
elif ref_structure[key] != locale_structure[key]:
issues.append(f"Type mismatch at {current_path}: expected {ref_structure[key]}, got {locale_structure[key]}")
# Check for extra keys in locale
for key in locale_structure:
current_path = f"{path}.{key}" if path else key
if key not in ref_structure:
issues.append(f"Extra key: {current_path}")
return issues
def extract_line_structure(line: str) -> Dict[str, str]:
"""
Extract structural elements from a JSON line.
Returns indentation, key (if present), and structural characters.
"""
# Get indentation (leading whitespace)
indentation = len(line) - len(line.lstrip())
# Remove leading/trailing whitespace for analysis
stripped_line = line.strip()
# Extract key if this is a key-value line
key_match = re.match(r'^"([^"]+)"\s*:\s*', stripped_line)
key = key_match.group(1) if key_match else ''
# Extract structural characters (everything except the actual translation value)
if key:
# For key-value lines, extract everything except the value
# Handle string values in quotes with better escaping support
value_pattern = r'^"[^"]+"\s*:\s*("(?:[^"\\]|\\.)*")(.*?)$'
value_match = re.match(value_pattern, stripped_line)
if value_match:
# Preserve the structure but replace the actual string content
structural_chars = f'"{key}": "VALUE"{value_match.group(2)}'
else:
# Handle non-string values (objects, arrays, booleans, numbers)
colon_pos = stripped_line.find(':')
if colon_pos != -1:
after_colon = stripped_line[colon_pos + 1:].strip()
if after_colon.startswith('"'):
# String value - find the end quote with proper escaping
end_quote = find_closing_quote(after_colon, 1)
if end_quote != -1:
structural_chars = f'"{key}": "VALUE"{after_colon[end_quote + 1:]}'
else:
structural_chars = f'"{key}": "VALUE"'
elif after_colon.startswith('{'):
# Object value
structural_chars = f'"{key}": {{'
elif after_colon.startswith('['):
# Array value
structural_chars = f'"{key}": ['
else:
# Other values (numbers, booleans, null)
# Replace the actual value with a placeholder
value_end = find_value_end(after_colon)
structural_chars = f'"{key}": VALUE{after_colon[value_end:]}'
else:
structural_chars = stripped_line
else:
# For non key-value lines (brackets, etc.), keep as-is
structural_chars = stripped_line
return {
'indentation': str(indentation),
'key': key,
'structural_chars': structural_chars
}
def find_value_end(text: str) -> int:
"""
Find the end of a non-string JSON value (number, boolean, null).
"""
for i, char in enumerate(text):
if char in ',}]':
return i
return len(text)
def find_closing_quote(text: str, start: int) -> int:
"""
Find the position of the closing quote, handling escaped quotes properly.
"""
i = start
while i < len(text):
if text[i] == '"':
# Count preceding backslashes
backslash_count = 0
j = i - 1
while j >= 0 and text[j] == '\\':
backslash_count += 1
j -= 1
# If even number of backslashes (including 0), the quote is not escaped
if backslash_count % 2 == 0:
return i
i += 1
return -1
def compare_line_formats(ref_lines: List[str], locale_lines: List[str], locale_name: str) -> List[str]:
"""
Compare line-by-line formatting between reference and locale files.
Only checks structural elements (indentation, brackets, commas) and ignores translation values.
"""
issues = []
for i, (ref_line, locale_line) in enumerate(zip(ref_lines, locale_lines)):
line_num = i + 1
# Skip empty lines and lines with only whitespace
if not ref_line.strip() and not locale_line.strip():
continue
# Extract structural elements from each line
ref_structure = extract_line_structure(ref_line)
locale_structure = extract_line_structure(locale_line)
# Compare structural elements with more tolerance
structure_issues = []
# Check indentation (must be exact)
if ref_structure['indentation'] != locale_structure['indentation']:
structure_issues.append(f"indentation ({ref_structure['indentation']} vs {locale_structure['indentation']})")
# Check keys (must be exact for structural consistency)
if ref_structure['key'] != locale_structure['key']:
structure_issues.append(f"key ('{ref_structure['key']}' vs '{locale_structure['key']}')")
# Check structural characters with improved normalization
ref_normalized = normalize_structural_chars(ref_structure['structural_chars'])
locale_normalized = normalize_structural_chars(locale_structure['structural_chars'])
if ref_normalized != locale_normalized:
# Additional check: if both lines have the same key and similar structure,
# this might be a false positive due to translation content differences
if (ref_structure['key'] and locale_structure['key'] and
ref_structure['key'] == locale_structure['key']):
# Check if the difference is only in the translation value
ref_has_string_value = '"VALUE"' in ref_normalized
locale_has_string_value = '"VALUE"' in locale_normalized
if ref_has_string_value and locale_has_string_value:
# Both have string values, check if structure around value is same
ref_structure_only = re.sub(r'"VALUE"', '"X"', ref_normalized)
locale_structure_only = re.sub(r'"VALUE"', '"X"', locale_normalized)
if ref_structure_only == locale_structure_only:
# Structure is actually the same, skip this as false positive
continue
structure_issues.append(f"structure ('{ref_normalized}' vs '{locale_normalized}')")
if structure_issues:
issues.append(f"Line {line_num}: {', '.join(structure_issues)}")
return issues
def normalize_structural_chars(structural_chars: str) -> str:
"""
Normalize structural characters for comparison by replacing variable content
with placeholders while preserving the actual structure.
"""
# Normalize the structural characters more carefully
normalized = structural_chars
# Replace quoted strings with a consistent placeholder, handling escapes
# This regex matches strings while properly handling escaped quotes
string_pattern = r'"(?:[^"\\]|\\.)*"(?=\s*[,}\]:}]|$)'
# Find all string matches and replace with placeholder
strings = re.findall(string_pattern, normalized)
for string_match in strings:
# Only replace if this looks like a translation value, not a key
if ':' in normalized:
# Check if this string comes after a colon (likely a value)
parts = normalized.split(':', 1)
if len(parts) == 2 and string_match in parts[1]:
normalized = normalized.replace(string_match, '"VALUE"', 1)
# Normalize whitespace around structural characters
normalized = re.sub(r'\s*:\s*', ': ', normalized)
normalized = re.sub(r'\s*,\s*', ', ', normalized)
normalized = re.sub(r'\s*{\s*', '{ ', normalized)
normalized = re.sub(r'\s*}\s*', ' }', normalized)
return normalized.strip()
def test_locale_files_formatting_consistency():
"""Test that all locale files have identical formatting (whitespace, indentation, etc.)."""
print("\nTesting locale files formatting consistency...")
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
expected_locales = ['en', 'zh-CN', 'zh-TW', 'ja', 'ru', 'de', 'fr', 'es', 'ko']
# Read reference file (en.json)
reference_path = os.path.join(locales_dir, 'en.json')
try:
with open(reference_path, 'r', encoding='utf-8') as f:
reference_lines = f.readlines()
except Exception as e:
print(f"❌ Error reading reference file: {e}")
return False
success = True
# Compare each locale file
for locale in expected_locales[1:]: # Skip 'en' as it's the reference
locale_path = os.path.join(locales_dir, f'{locale}.json')
if not os.path.exists(locale_path):
print(f"{locale}.json does not exist!")
success = False
continue
try:
with open(locale_path, 'r', encoding='utf-8') as f:
locale_lines = f.readlines()
# Compare line count
if len(locale_lines) != len(reference_lines):
print(f"{locale}.json: Line count differs from reference")
print(f" Reference: {len(reference_lines)} lines")
print(f" {locale}: {len(locale_lines)} lines")
success = False
continue
# Compare formatting with improved algorithm
formatting_issues = compare_line_formats(reference_lines, locale_lines, locale)
if formatting_issues:
print(f"{locale}.json: Formatting issues found")
# Show only the first few issues to avoid spam
shown_issues = 0
for issue in formatting_issues:
if shown_issues < 3: # Reduced from 5 to 3
print(f" - {issue}")
shown_issues += 1
else:
break
if len(formatting_issues) > 3:
print(f" ... and {len(formatting_issues) - 3} more issues")
# Provide debug info for first issue to help identify false positives
if formatting_issues:
first_issue = formatting_issues[0]
line_match = re.match(r'Line (\d+):', first_issue)
if line_match:
line_num = int(line_match.group(1)) - 1 # Convert to 0-based
if 0 <= line_num < len(reference_lines):
print(f" Debug - Reference line {line_num + 1}: {repr(reference_lines[line_num].rstrip())}")
print(f" Debug - {locale} line {line_num + 1}: {repr(locale_lines[line_num].rstrip())}")
success = False
else:
print(f"{locale}.json: Formatting consistent with reference")
except Exception as e:
print(f"❌ Error validating {locale}.json: {e}")
success = False
if success:
print("✅ All locale files have consistent formatting")
else:
print("💡 Note: Some formatting differences may be false positives due to translation content.")
print(" If translations are correct but structure appears different, the test may need refinement.")
return success
def test_locale_key_ordering():
"""Test that all locale files maintain the same key ordering as the reference."""
print("\nTesting locale files key ordering...")
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
expected_locales = ['en', 'zh-CN', 'zh-TW', 'ja', 'ru', 'de', 'fr', 'es', 'ko']
# Load reference file
reference_path = os.path.join(locales_dir, 'en.json')
try:
with open(reference_path, 'r', encoding='utf-8') as f:
reference_data = json.load(f, object_pairs_hook=lambda x: x) # Preserve order
reference_key_order = get_key_order(reference_data)
except Exception as e:
print(f"❌ Error reading reference file: {e}")
return False
success = True
for locale in expected_locales[1:]: # Skip 'en' as it's the reference
locale_path = os.path.join(locales_dir, f'{locale}.json')
if not os.path.exists(locale_path):
continue
try:
with open(locale_path, 'r', encoding='utf-8') as f:
locale_data = json.load(f, object_pairs_hook=lambda x: x) # Preserve order
locale_key_order = get_key_order(locale_data)
if reference_key_order != locale_key_order:
print(f"{locale}.json: Key ordering differs from reference")
# Find the first difference
for i, (ref_key, locale_key) in enumerate(zip(reference_key_order, locale_key_order)):
if ref_key != locale_key:
print(f" First difference at position {i}: '{ref_key}' vs '{locale_key}'")
break
success = False
else:
print(f"{locale}.json: Key ordering matches reference")
except Exception as e:
print(f"❌ Error validating {locale}.json key ordering: {e}")
success = False
return success
def get_key_order(data: Any, path: str = '') -> List[str]:
"""
Extract the order of keys from nested JSON data.
Returns a list of all keys in their order of appearance.
"""
keys = []
if isinstance(data, list):
# Handle list of key-value pairs (from object_pairs_hook)
for key, value in data:
current_path = f"{path}.{key}" if path else key
keys.append(current_path)
if isinstance(value, list): # Nested object as list of pairs
keys.extend(get_key_order(value, current_path))
elif isinstance(data, dict):
for key, value in data.items():
current_path = f"{path}.{key}" if path else key
keys.append(current_path)
if isinstance(value, (dict, list)):
keys.extend(get_key_order(value, current_path))
return keys
def test_server_i18n():
"""Test the Python server-side i18n system."""
print("\nTesting Python server-side i18n...")
try:
from py.services.server_i18n import ServerI18nManager
# Create a new instance to test
i18n = ServerI18nManager()
# Test that translations loaded
available_locales = i18n.get_available_locales()
if not available_locales:
print("❌ No locales loaded in server i18n!")
return False
print(f"✅ Loaded {len(available_locales)} locales: {', '.join(available_locales)}")
# Test English translations
i18n.set_locale('en')
test_key = 'common.status.loading'
translation = i18n.get_translation(test_key)
if translation == test_key:
print(f"❌ Translation not found for key '{test_key}'")
return False
print(f"✅ English translation for '{test_key}': '{translation}'")
# Test Chinese translations
i18n.set_locale('zh-CN')
translation_cn = i18n.get_translation(test_key)
if translation_cn == test_key:
print(f"❌ Chinese translation not found for key '{test_key}'")
return False
print(f"✅ Chinese translation for '{test_key}': '{translation_cn}'")
# Test parameter interpolation
param_key = 'common.itemCount'
translation_with_params = i18n.get_translation(param_key, count=42)
if '{count}' in translation_with_params:
print(f"❌ Parameter interpolation failed for key '{param_key}'")
return False
print(f"✅ Parameter interpolation for '{param_key}': '{translation_with_params}'")
print("✅ Server-side i18n system working correctly")
return True
except Exception as e:
print(f"❌ Error testing server i18n: {e}")
import traceback
traceback.print_exc()
return False
def test_translation_completeness():
"""Test that all languages have the same translation keys."""
print("\nTesting translation completeness...")
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
# Load English as reference
with open(os.path.join(locales_dir, 'en.json'), 'r', encoding='utf-8') as f:
en_data = json.load(f)
en_keys = get_all_translation_keys(en_data)
print(f"English has {len(en_keys)} translation keys")
# Check other languages
locales = ['zh-CN', 'zh-TW', 'ja', 'ru', 'de', 'fr', 'es', 'ko']
for locale in locales:
with open(os.path.join(locales_dir, f'{locale}.json'), 'r', encoding='utf-8') as f:
locale_data = json.load(f)
locale_keys = get_all_translation_keys(locale_data)
missing_keys = en_keys - locale_keys
extra_keys = locale_keys - en_keys
if missing_keys:
print(f"{locale} missing keys: {len(missing_keys)}")
# Print first few missing keys
for key in sorted(missing_keys)[:5]:
print(f" - {key}")
if len(missing_keys) > 5:
print(f" ... and {len(missing_keys) - 5} more")
if extra_keys:
print(f"⚠️ {locale} has extra keys: {len(extra_keys)}")
if not missing_keys and not extra_keys:
print(f"{locale} has complete translations ({len(locale_keys)} keys)")
return True
def extract_i18n_keys_from_js(file_path: str) -> Set[str]:
"""Extract translation keys from JavaScript files."""
keys = set()
try:
with open(file_path, 'r', encoding='utf-8') as f:
content = f.read()
# Remove comments to avoid false positives
# Remove single-line comments
content = re.sub(r'//.*$', '', content, flags=re.MULTILINE)
# Remove multi-line comments
content = re.sub(r'/\*.*?\*/', '', content, flags=re.DOTALL)
# Pattern for translate() function calls - more specific
# Matches: translate('key.name', ...) or translate("key.name", ...)
# Must have opening parenthesis immediately after translate
translate_pattern = r"\btranslate\s*\(\s*['\"]([a-zA-Z0-9._-]+)['\"]"
translate_matches = re.findall(translate_pattern, content)
# Filter out single words that are likely not translation keys
# Translation keys should typically have dots or be in specific namespaces
filtered_translate = [key for key in translate_matches if '.' in key or key in [
'loading', 'error', 'success', 'warning', 'info', 'cancel', 'save', 'delete'
]]
keys.update(filtered_translate)
# Pattern for showToast() function calls - more specific
# Matches: showToast('key.name', ...) or showToast("key.name", ...)
showtoast_pattern = r"\bshowToast\s*\(\s*['\"]([a-zA-Z0-9._-]+)['\"]"
showtoast_matches = re.findall(showtoast_pattern, content)
# Filter showToast matches as well
filtered_showtoast = [key for key in showtoast_matches if '.' in key or key in [
'loading', 'error', 'success', 'warning', 'info', 'cancel', 'save', 'delete'
]]
keys.update(filtered_showtoast)
# Additional patterns for other i18n function calls you might have
# Pattern for t() function calls (if used in JavaScript)
t_pattern = r"\bt\s*\(\s*['\"]([a-zA-Z0-9._-]+)['\"]"
t_matches = re.findall(t_pattern, content)
filtered_t = [key for key in t_matches if '.' in key or key in [
'loading', 'error', 'success', 'warning', 'info', 'cancel', 'save', 'delete'
]]
keys.update(filtered_t)
except Exception as e:
print(f"⚠️ Error reading {file_path}: {e}")
return keys
def extract_i18n_keys_from_html(file_path: str) -> Set[str]:
"""Extract translation keys from HTML template files."""
keys = set()
try:
with open(file_path, 'r', encoding='utf-8') as f:
content = f.read()
# Remove HTML comments to avoid false positives
content = re.sub(r'<!--.*?-->', '', content, flags=re.DOTALL)
# Pattern for t() function calls in Jinja2 templates
# Matches: {{ t('key.name') }} or {% ... t('key.name') ... %}
# More specific pattern that ensures we're in template context
t_pattern = r"(?:\{\{|\{%)[^}]*\bt\s*\(\s*['\"]([a-zA-Z0-9._-]+)['\"][^}]*(?:\}\}|%\})"
t_matches = re.findall(t_pattern, content)
# Filter HTML matches
filtered_t = [key for key in t_matches if '.' in key or key in [
'loading', 'error', 'success', 'warning', 'info', 'cancel', 'save', 'delete'
]]
keys.update(filtered_t)
# Also check for translate() calls in script tags within HTML
script_pattern = r'<script[^>]*>(.*?)</script>'
script_matches = re.findall(script_pattern, content, flags=re.DOTALL)
for script_content in script_matches:
# Apply JavaScript extraction to script content
translate_pattern = r"\btranslate\s*\(\s*['\"]([a-zA-Z0-9._-]+)['\"]"
script_translate_matches = re.findall(translate_pattern, script_content)
filtered_script = [key for key in script_translate_matches if '.' in key]
keys.update(filtered_script)
except Exception as e:
print(f"⚠️ Error reading {file_path}: {e}")
return keys
def get_all_translation_keys(data: dict, prefix: str = '', include_containers: bool = False) -> Set[str]:
"""
Recursively collect translation keys.
By default only leaf keys (where the value is NOT a dict) are returned so that
structural/container nodes (e.g. 'common', 'common.actions') are not treated
as real translation entries and won't appear in the 'unused' list.
Set include_containers=True to also include container/object nodes.
"""
keys: Set[str] = set()
if not isinstance(data, dict):
return keys
for key, value in data.items():
full_key = f"{prefix}.{key}" if prefix else key
if isinstance(value, dict):
# Recurse first
keys.update(get_all_translation_keys(value, full_key, include_containers))
# Optionally include container nodes
if include_containers:
keys.add(full_key)
else:
# Leaf node: actual translatable value
keys.add(full_key)
return keys
def test_static_code_analysis():
"""Test static code analysis to detect missing translation keys."""
# print("\nTesting static code analysis for translation keys...")
# Load English translations as reference
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
with open(os.path.join(locales_dir, 'en.json'), 'r', encoding='utf-8') as f:
en_data = json.load(f)
available_keys = get_all_translation_keys(en_data)
# print(f"Available translation keys in en.json: {len(available_keys)}")
# Known false positives to exclude from analysis
# These are typically HTML attributes, CSS classes, or other non-translation strings
false_positives = {
'checkpoint', 'civitai_api_key', 'div', 'embedding', 'lora', 'show_only_sfw',
'model', 'type', 'name', 'value', 'id', 'class', 'style', 'src', 'href',
'data', 'width', 'height', 'size', 'format', 'version', 'url', 'path',
'file', 'folder', 'image', 'text', 'number', 'boolean', 'array', 'object', 'non.existent.key'
}
# Extract keys from JavaScript files
js_dir = os.path.join(os.path.dirname(__file__), 'static', 'js')
js_files = []
if os.path.exists(js_dir):
# Recursively find all JS files
for root, dirs, files in os.walk(js_dir):
for file in files:
if file.endswith('.js'):
js_files.append(os.path.join(root, file))
js_keys = set()
js_files_with_keys = []
for js_file in js_files:
file_keys = extract_i18n_keys_from_js(js_file)
# Filter out false positives
file_keys = file_keys - false_positives
js_keys.update(file_keys)
if file_keys:
rel_path = os.path.relpath(js_file, os.path.dirname(__file__))
js_files_with_keys.append((rel_path, len(file_keys)))
# print(f" Found {len(file_keys)} keys in {rel_path}")
# print(f"Total unique keys found in JavaScript files: {len(js_keys)}")
# Extract keys from HTML template files
templates_dir = os.path.join(os.path.dirname(__file__), 'templates')
html_files = []
if os.path.exists(templates_dir):
html_files = glob.glob(os.path.join(templates_dir, '*.html'))
# Also check for HTML files in subdirectories
html_files.extend(glob.glob(os.path.join(templates_dir, '**', '*.html'), recursive=True))
html_keys = set()
html_files_with_keys = []
for html_file in html_files:
file_keys = extract_i18n_keys_from_html(html_file)
# Filter out false positives
file_keys = file_keys - false_positives
html_keys.update(file_keys)
if file_keys:
rel_path = os.path.relpath(html_file, os.path.dirname(__file__))
html_files_with_keys.append((rel_path, len(file_keys)))
# print(f" Found {len(file_keys)} keys in {rel_path}")
# print(f"Total unique keys found in HTML templates: {len(html_keys)}")
# Combine all used keys
all_used_keys = js_keys.union(html_keys)
# print(f"Total unique keys used in code: {len(all_used_keys)}")
# Check for missing keys
missing_keys = all_used_keys - available_keys
unused_keys = available_keys - all_used_keys
success = True
if missing_keys:
print(f"\n❌ Found {len(missing_keys)} missing translation keys:")
for key in sorted(missing_keys):
print(f" - {key}")
success = False
# Group missing keys by category for better analysis
key_categories = {}
for key in missing_keys:
category = key.split('.')[0] if '.' in key else 'root'
if category not in key_categories:
key_categories[category] = []
key_categories[category].append(key)
print(f"\n Missing keys by category:")
for category, keys in sorted(key_categories.items()):
print(f" {category}: {len(keys)} keys")
# Provide helpful suggestion
print(f"\n💡 If these are false positives, add them to the false_positives set in test_static_code_analysis()")
else:
print("\n✅ All translation keys used in code are available in en.json")
if unused_keys:
print(f"\n⚠️ Found {len(unused_keys)} unused translation keys in en.json:")
# Only show first 20 to avoid cluttering output
for key in sorted(unused_keys)[:20]:
print(f" - {key}")
if len(unused_keys) > 20:
print(f" ... and {len(unused_keys) - 20} more")
# Group unused keys by category for better analysis
unused_categories = {}
for key in unused_keys:
category = key.split('.')[0] if '.' in key else 'root'
if category not in unused_categories:
unused_categories[category] = []
unused_categories[category].append(key)
print(f"\n Unused keys by category:")
for category, keys in sorted(unused_categories.items()):
print(f" {category}: {len(keys)} keys")
# Summary statistics
# print(f"\n📊 Static Code Analysis Summary:")
# print(f" JavaScript files analyzed: {len(js_files)}")
# print(f" JavaScript files with translations: {len(js_files_with_keys)}")
# print(f" HTML template files analyzed: {len(html_files)}")
# print(f" HTML template files with translations: {len(html_files_with_keys)}")
# print(f" Translation keys in en.json: {len(available_keys)}")
# print(f" Translation keys used in code: {len(all_used_keys)}")
# print(f" Usage coverage: {len(all_used_keys)/len(available_keys)*100:.1f}%")
return success
def test_json_structure_validation():
"""Test JSON file structure and syntax validation."""
print("\nTesting JSON file structure and syntax validation...")
locales_dir = os.path.join(os.path.dirname(__file__), 'locales')
if not os.path.exists(locales_dir):
print("❌ Locales directory does not exist!")
return False
expected_locales = ['en', 'zh-CN', 'zh-TW', 'ja', 'ru', 'de', 'fr', 'es', 'ko']
success = True
for locale in expected_locales:
file_path = os.path.join(locales_dir, f'{locale}.json')
if not os.path.exists(file_path):
print(f"{locale}.json does not exist!")
success = False
continue
try:
with open(file_path, 'r', encoding='utf-8') as f:
data = json.load(f)
# Check for valid JSON structure
if not isinstance(data, dict):
print(f"{locale}.json root must be an object/dictionary")
success = False
continue
# Check that required sections exist
required_sections = ['common', 'header', 'loras', 'recipes', 'modals']
missing_sections = []
for section in required_sections:
if section not in data:
missing_sections.append(section)
if missing_sections:
print(f"{locale}.json missing required sections: {', '.join(missing_sections)}")
success = False
# Check for empty values
empty_values = []
def check_empty_values(obj, path=''):
if isinstance(obj, dict):
for key, value in obj.items():
current_path = f"{path}.{key}" if path else key
if isinstance(value, dict):
check_empty_values(value, current_path)
elif isinstance(value, str) and not value.strip():
empty_values.append(current_path)
elif value is None:
empty_values.append(current_path)
check_empty_values(data)
if empty_values:
print(f"⚠️ {locale}.json has {len(empty_values)} empty translation values:")
for path in empty_values[:5]: # Show first 5
print(f" - {path}")
if len(empty_values) > 5:
print(f" ... and {len(empty_values) - 5} more")
print(f"{locale}.json structure is valid")
except json.JSONDecodeError as e:
print(f"{locale}.json has invalid JSON syntax: {e}")
success = False
except Exception as e:
print(f"❌ Error validating {locale}.json: {e}")
success = False
return success
def main():
"""Run all tests."""
print("🚀 Testing updated i18n system...\n")
success = True
# Test JSON files structure and syntax
if not test_json_files_exist():
success = False
# Test comprehensive structural consistency
if not test_locale_files_structural_consistency():
success = False
# Test formatting consistency
if not test_locale_files_formatting_consistency():
success = False
# Test key ordering
if not test_locale_key_ordering():
success = False
# Test server i18n
if not test_server_i18n():
success = False
# Test translation completeness
if not test_translation_completeness():
success = False
# Test static code analysis
if not test_static_code_analysis():
success = False
print(f"\n{'🎉 All tests passed!' if success else '❌ Some tests failed!'}")
return success
if __name__ == '__main__':
main()