db65db6232
Android UI Tests / ui-tests (push) Has been cancelled
Localize all user-facing strings across iOS (SwiftUI), shared Kotlin, and Android Compose into en/es/fr/de/pt/it/ja/ko/nl/zh: - iOS String Catalogs: main + widget Localizable.xcstrings, InfoPlist.xcstrings (permissions), plural variations, ~200 new keys translated - Shared Kotlin ClientStrings table + Android composeResources/values-* (884 keys ×10), routed Api/ViewModel/util error & UI strings through localization - Backend-localized lookups/suggestions consumed via display names - Widget extension catalog; theme names, home-profile fallbacks, validation, network errors, accessibility labels all localized Add re-runnable verification gates: - scripts/i18n_audit.py — enumerate every literal, partition to GAP=0 - scripts/i18n_coverage.py — all 10 locales translated, format-specifier parity Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
298 lines
13 KiB
Python
298 lines
13 KiB
Python
#!/usr/bin/env python3
|
|
"""
|
|
i18n_audit.py — exhaustive localization gap detector for honeyDue (KMM).
|
|
|
|
Method: enumerate EVERY prose string literal in the iOS Swift + shared Kotlin
|
|
sources (char-aware: comments and interpolation excluded), then assign each to
|
|
exactly one bucket:
|
|
|
|
LOCALIZED — inside a localization wrapper (String(localized:), stringResource,
|
|
ClientStrings.t, LocalizedStringKey, NSLocalizedString,
|
|
LocalizedStringResource/IntentDescription, ...) or the direct
|
|
literal argument of an auto-localizing SwiftUI view init/modifier
|
|
(Text, Label, Button, .navigationTitle, .accessibilityLabel, ...).
|
|
ALLOWLIST — matches an explicit, reviewable non-UI rule (logging, asset/symbol
|
|
names, color/asset lookups, keys, URLs, routes, regex/predicate,
|
|
date-format patterns, API-value comparisons, serialization, the
|
|
brand name "honeyDue") OR is suppressed by an inline directive.
|
|
GAP — everything else. THIS BUCKET MUST BE EMPTY.
|
|
|
|
"Done" == GAP count is 0: every literal accounted for in LOCALIZED or ALLOWLIST.
|
|
High recall by design. False positives are silenced ONLY by a documented allowlist
|
|
rule or an in-source suppression directive — never by narrowing the enumeration.
|
|
|
|
Inline suppression (auditable; reviewed by the adversarial re-scan):
|
|
"..." // i18n-ignore: <reason> skip literals on this line
|
|
// i18n-ignore-next: <reason> skip the next code line
|
|
// i18n-ignore-begin: <reason> ... // i18n-ignore-end skip the region
|
|
|
|
Usage:
|
|
python3 scripts/i18n_audit.py [--json OUT] [--all] [--allowlist]
|
|
Exit code: 0 if GAP==0 else 1 (CI gate).
|
|
"""
|
|
import os, re, sys, json, argparse
|
|
|
|
# Repository root: the parent of the directory that holds this script.
_SCRIPT_DIR = os.path.dirname(os.path.abspath(__file__))
ROOT = os.path.dirname(_SCRIPT_DIR)

# Source trees to audit, relative to ROOT.
IOS_DIRS = [
    "iosApp/iosApp",
    "iosApp/HoneyDue",
]
KT_DIRS = [
    "composeApp/src/commonMain/kotlin",
]
|
|
|
|
# Paths excluded from the audit. Each key is a substring looked for in a file's
# path; the value records why that path is out of scope (test data, samples,
# analytics identifiers, the translation data store, dev-only screens).
SKIP_PATH_SUBSTR = {
    "/build/": "build artifacts",
    "/DerivedData/": "build artifacts",
    "ClientStringsData.kt": "translation data store",
    "/testing/": "test fixtures",
    "Fixtures.kt": "test fixtures",
    "/analytics/": "analytics event/property identifiers (non-UI)",
    "Greeting.kt": "KMM template boilerplate",
    "/dev/": "dev-only screen (Android, unreachable)",
    "AnimationTestingScreen.kt": "dev-only screen (Android, unregistered route)",
    "SimpleTaskListItem.kt": "dead/unused component",
    # NOTE: iOS /AnimationTesting/ is intentionally NOT skipped — it ships & is
    # reachable from Profile > Completion Animation (no #if DEBUG gate).
}

# Test and mock sources, recognised by path shape rather than by exact name.
SKIP_PATH_REGEX = re.compile(
    r"(Tests?/|UITests?/|/Test[A-Z]|Tests\.swift$|/Mock)"
)
|
|
|
|
# ---------- char-aware literal extraction (comments + triple-strings handled) ----------
|
|
def extract_literals(line, state):
    """Return ``(col, inner)`` for each single-line string literal on `line`.

    ``col`` is the index of the opening quote within `line` itself, and
    ``inner`` is the raw text between the quotes with escape sequences kept
    verbatim (backslash plus the following character).

    `state` is a dict with boolean keys ``"block"`` and ``"triple"`` and is
    mutated in place so that an open ``/* ... */`` comment or an open
    triple-quoted string carries over to the next line.

    Skipped: everything after ``//``, everything inside ``/* ... */``, and the
    contents of triple-quoted strings (they are consumed, never returned).
    An unterminated literal runs to the end of the line.
    """
    lits = []
    i, n = 0, len(line)
    if state["triple"]:
        idx = line.find('"""')
        if idx < 0:
            return lits
        state["triple"] = False
        # Resume just past the terminator instead of slicing the line, so the
        # columns reported below stay valid indexes into the caller's `line`.
        i = idx + 3
    while i < n:
        if state["block"]:
            j = line.find("*/", i)
            if j < 0:
                return lits
            state["block"] = False
            i = j + 2
            continue
        c = line[i]
        if c == "/" and i + 1 < n and line[i + 1] == "/":
            break  # line comment -> rest ignored
        if c == "/" and i + 1 < n and line[i + 1] == "*":
            state["block"] = True
            i += 2
            continue
        if c == '"':
            if line[i:i + 3] == '"""':
                k = line.find('"""', i + 3)
                if k < 0:
                    # Triple-quoted string continues on the following line(s).
                    state["triple"] = True
                    return lits
                i = k + 3
                continue
            start = i
            i += 1
            buf = []
            while i < n:
                if line[i] == "\\":
                    # Keep the escape pair intact so an escaped quote does not
                    # terminate the literal.
                    buf.append(line[i:i + 2])
                    i += 2
                    continue
                if line[i] == '"':
                    break
                buf.append(line[i])
                i += 1
            lits.append((start, "".join(buf)))
            i += 1
            continue
        i += 1
    return lits
|
|
|
|
def strip_interpolation(lit):
    """Return `lit` with every interpolation segment replaced by ``X``.

    The substitutions run in a fixed order: Swift ``\\( ... )`` first, then
    Kotlin ``${ ... }``, then Kotlin ``$identifier``.
    """
    placeholders = (
        r"\\\([^)]*\)",                # swift \( ... )
        r"\$\{[^}]*\}",                # kotlin ${ ... }
        r"\$[A-Za-z_][A-Za-z0-9_]*",   # kotlin $ident
    )
    text = lit
    for pattern in placeholders:
        text = re.sub(pattern, "X", text)
    return text
|
|
|
|
# ---------- "prose" test ----------
|
|
def is_prose(s):
    """Return True when `s` looks like human-readable text worth auditing.

    `s` is a literal's content after interpolation has been replaced by ``X``.
    A string is rejected (False) when it has fewer than two letters or when it
    matches one of the machine-token shapes below: interpolation residue,
    dotted/snake/kebab keys and paths, URLs, format-spec residue, a single
    lowercase token, an ALLCAPS constant, or a hex value.
    """
    st = s.strip()
    if sum(c.isalpha() for c in st) < 2:
        return False
    if re.fullmatch(r"[X\W\s]*", st):  # only interpolation residue/punct
        return False
    if re.fullmatch(r"[A-Za-z0-9]+([._\-/][A-Za-z0-9]+)+", st):  # dotted.key/snake/kebab/path
        return False
    if ("/" in st or st.startswith("http")) and " " not in st:
        return False
    if re.fullmatch(r"[%@{}\d\s.,:#x*lld$\-]*", st):  # format-spec residue
        return False
    if re.fullmatch(r"[a-z][a-z0-9]*", st):  # lowercase single token (route/key)
        return False
    if re.fullmatch(r"[A-Z][A-Z0-9_]*", st):  # ALLCAPS const / api enum
        return False
    # hex/uuid-ish. A run of hex digits only counts as hex when it carries a
    # "#" prefix or at least one decimal digit; otherwise ordinary words made
    # of the letters a-f ("Add", "Feed", "Bad") would be dropped from the audit.
    if re.fullmatch(r"#?[0-9A-Fa-f]{3,}", st) and (
        st.startswith("#") or any(c.isdigit() for c in st)
    ):
        return False
    return True
|
|
|
|
def is_regex(s):
    """Return True when `s` contains a marker typical of a regex or predicate.

    Markers: an escaped class such as ``\\d``, an opening character class,
    a quantified ``]``, the word ``MATCHES``, a ``(?:`` group, a caret
    anywhere, or a trailing ``$``.
    """
    marker = re.search(
        r"\\[.dwsDWSbB]|\[[A-Za-z0-9^]|\]\+|\]\*|\]\{|MATCHES|\(\?:|\^|\$$",
        s,
    )
    return marker is not None
|
|
|
|
def is_date_pattern(s):
    """Return True when `s` consists solely of date-format pattern characters.

    The stripped string must contain at least one field letter from
    ``MdyHhmsaEZ`` and nothing besides those letters, whitespace and the
    separators ``: / . , ' -``.
    """
    candidate = s.strip()
    has_field_letter = re.search(r"[MdyHhmsaEZ]", candidate) is not None
    only_pattern_chars = re.fullmatch(r"[MdyHhmsaEZ:/.,'\s\-]+", candidate) is not None
    return has_field_letter and only_pattern_chars
|
|
|
|
# Explicit localization wrappers. The pattern is anchored with `$`, so it only
# matches when the wrapper call is the text immediately preceding the literal.
LOCALIZED_PREFIX = re.compile(
    "("
    + "|".join((
        r"String\(\s*localized:\s*",
        r"LocalizedStringKey\(\s*",
        r"NSLocalizedString\(\s*",
        r"ClientStrings\.t\(\s*",
        r"\.t\(\s*",
        r"IntentDescription\(\s*",
        r"LocalizedStringResource\(\s*",
        r"TypeDisplayRepresentation\(\s*name:\s*",
        r"DisplayRepresentation\(\s*title:\s*",
        r"stringResource\(\s*",
    ))
    + ")$"
)
|
|
|
|
# SwiftUI initializers/modifiers whose direct string-literal argument is treated
# as auto-localizing. Anchored with `$`: the call must be the text immediately
# before the literal.
#
# `Text(verbatim:)` is deliberately absent: that initializer displays its string
# without localization, so such a literal must not be counted as LOCALIZED. It
# falls through to the allowlist rules / GAP like any other unwrapped string.
AUTOLOC_PREFIX = re.compile(
    r"(\bText\(\s*|\bLabel\(\s*|\bButton\(\s*|\bToggle\(\s*"
    r"|\bPicker\(\s*|\bStepper\(\s*|\bLink\(\s*|\bMenu\(\s*|\bTextField\(\s*"
    r"|\bSecureField\(\s*|\bNavigationLink\(\s*|\bSection\(\s*"
    r"|\.navigationTitle\(\s*|\.navigationBarTitle\(\s*|\.help\(\s*"
    r"|\.accessibilityLabel\(\s*|\.accessibilityHint\(\s*|\.accessibilityValue\(\s*"
    r"|\.alert\(\s*|\.confirmationDialog\(\s*|\.configurationDisplayName\(\s*|\.description\(\s*"
    # `titleKey:` is SwiftUI's documented LocalizedStringKey param. Other labeled
    # args (label:/title:/message:/...) are NOT trusted — custom components often
    # take a plain String and render it verbatim (Text(String)), bypassing the
    # catalog. Those must be explicitly wrapped, so we let them fall through to GAP.
    r"|\btitleKey:\s*)$")
|
|
|
|
# Non-UI call sites, matched against the text immediately before a literal.
# The pattern is anchored with `$`, so alternatives that do not end in an
# opening delimiter (e.g. `Logger`, `os_log`) match only when that exact text
# directly abuts the literal.
ALLOWLIST_PREFIX = re.compile(
    "("
    + "|".join((
        # logging
        r"print\(", r"NSLog\(", r"os_log", r"Logger", r"\bprintln\(", r"\blog\.",
        r"Log\.[a-z]+\(",
        r"\.debug\(", r"\.error\(", r"\.info\(", r"\.warning\(", r"\.fault\(",
        r"\.verbose\(",
        # asset / symbol / color lookups
        r"systemName:\s*", r"\bImage\(\s*", r"\bUIImage\(", r"named:\s*",
        r"Color\(\s*", r"UIColor\(", r"themed\(\s*",
        # keys, headers, paths, URLs, fonts
        r"forKey:\s*", r"forHTTPHeaderField:\s*", r"setValue\(", r"withName:\s*",
        r"appendPathComponent\(\s*",
        r"URL\(\s*string:\s*", r"accessibilityIdentifier\(\s*", r"\.font\(",
        r"Font\(", r"fontName", r"infoDictionary\??!?\[",
        # navigation routes
        r"navigate\(\s*", r"composable\(\s*", r"route\s*=\s*", r"startDestination",
        # serialization / predicates
        r"@SerialName\(\s*", r"SerialName\(\s*", r"JSONDecoder", r"JSONEncoder",
        r"NSPredicate\(\s*format:\s*",
        # comparisons against API values
        r"==\s*", r"!=\s*", r"\bcase\s+", r"contains\(\s*", r"hasPrefix\(\s*",
        r"hasSuffix\(\s*", r"range\(\s*of:\s*",
        # tags, identifiers, bundle / notification names
        r"\.tag\(\s*", r"identifier:\s*", r"kCFBundle", r"Bundle\.",
        r"Notification\.Name\(\s*", r"previewDisplayName\(\s*",
        r"NotificationCenter",
    ))
    + ")$"
)
|
|
|
|
# Markers that allowlist a literal when they occur anywhere on its line
# (unanchored, unlike the *_PREFIX patterns).
ALLOWLIST_LINE = re.compile(
    "("
    + "|".join((
        r"accessibilityIdentifier",
        r"AccessibilityIdentifiers\.",
        r"UserDefaults",
        r"keychain",
        r"Keychain",
        r"mimeType",
        r"MimeType",
        r'contentType:\s*\"',
        r"application/json",
        r"image/jpeg",
        r"text/plain",
        r"NSPredicate\(format:",
        r"\.regularExpression",
        r"Icons\.",
        r"Notification\.Name\(",
    ))
    + ")"
)
|
|
|
|
# A line that mentions any of these declares an iOS LocalizedStringResource /
# IntentDescription / AppEnum display value, or an AppIntent @Parameter(title:)
# (title is a LocalizedStringResource → auto-localizes). Matched anywhere on the line.
LOCALIZED_LINE = re.compile(
    "("
    + "|".join((
        r"LocalizedStringResource",
        r"IntentDescription",
        r"DisplayRepresentation",
        r"TypeDisplayRepresentation",
        r"@Parameter\(",
    ))
    + ")"
)
|
|
|
|
def classify(lang, prefix, inner_clean, raw, suffix):
    """Assign one literal to ``"localized"``, ``"allowlist"`` or ``"gap"``.

    Args:
        lang: ``"swift"`` or ``"kotlin"``.
        prefix: text of the line before the literal's opening quote; only its
            last 80 characters are matched against the prefix patterns.
        inner_clean: literal content with interpolation already replaced.
        raw: the complete source line.
        suffix: text of the line after the literal's closing quote.

    Rules are applied in a fixed order and the first hit wins: brand name,
    regex/date pattern, Kotlin ``"x" to "y"`` mapping key, localization
    wrapper, Swift auto-localizing call or declaration line, allowlist rule.
    Anything left over is a gap.
    """
    window = prefix[-80:]

    is_brand = inner_clean.strip() == "honeyDue"
    if is_brand or is_regex(inner_clean) or is_date_pattern(inner_clean):
        return "allowlist"

    # Kotlin detection-pattern map: "incoming error substring" to "err.key"
    if lang == "kotlin" and re.match(r'\s*to\s+"', suffix) is not None:
        return "allowlist"

    wrapped = LOCALIZED_PREFIX.search(window) is not None
    if not wrapped and lang == "swift":
        wrapped = bool(AUTOLOC_PREFIX.search(window) or LOCALIZED_LINE.search(raw))
    if wrapped:
        return "localized"

    allowlisted = ALLOWLIST_PREFIX.search(window) or ALLOWLIST_LINE.search(raw)
    return "allowlist" if allowlisted else "gap"
|
|
|
|
# Marks the start of a SwiftUI preview (#Preview macro or PreviewProvider type).
_PREVIEW_MARKER = re.compile(r"#Preview\b|PreviewProvider|_Previews\b")


def scan_file(path, lang):
    """Scan one source file and bucket every prose literal it contains.

    Args:
        path: absolute path of the file to read (decoded as UTF-8).
        lang: ``"swift"`` or ``"kotlin"``; forwarded to ``classify``.

    Returns:
        A dict with keys ``"localized"``, ``"allowlist"`` and ``"gap"``. Each
        value is a list of records ``{"file", "line", "text", "ctx"}``;
        inline-suppressed records also carry ``"supp": True``. A file that
        cannot be read yields three empty lists and a warning on stderr.
    """
    rel = os.path.relpath(path, ROOT)
    out = {"localized": [], "allowlist": [], "gap": []}
    try:
        with open(path, encoding="utf-8") as fh:
            lines = fh.read().splitlines()
    except (OSError, UnicodeDecodeError) as exc:
        # Still best-effort, but no longer silent: an unreadable file would
        # otherwise look exactly like a file with nothing to report.
        print(f"i18n_audit: skipping unreadable file {rel}: {exc}", file=sys.stderr)
        return out

    state = {"block": False, "triple": False}
    ignore_region = False
    ignore_next = False
    preview_depth = 0        # brace depth while inside a #Preview / PreviewProvider block
    preview_pending = False  # marker seen, opening brace not seen yet

    for ln, raw in enumerate(lines, 1):
        line_ignored = ignore_next
        ignore_next = False
        if "i18n-ignore-begin" in raw:
            ignore_region = True
        if "i18n-ignore-end" in raw:
            ignore_region = False
        if "i18n-ignore-next" in raw:
            ignore_next = True

        # Always run the extractor, even on skipped lines, so block-comment and
        # triple-string state stays in sync with the file.
        lits = extract_literals(raw, state)

        # --- #Preview / PreviewProvider block skip (mock/sample data, not shipped UI) ---
        in_preview = preview_depth > 0 or preview_pending
        if not in_preview and _PREVIEW_MARKER.search(raw):
            in_preview = True
            preview_pending = True
        if in_preview:
            opened = raw.count("{")
            if opened:
                preview_pending = False
            # Depth counts real braces only. When the opening brace sits on the
            # line after the marker, the block is tracked via `preview_pending`
            # rather than a pre-armed depth, so the closing brace brings the
            # depth back to zero and scanning resumes.
            preview_depth = max(0, preview_depth + opened - raw.count("}"))
            continue

        if ignore_region or line_ignored:
            continue

        line_suppress = "i18n-ignore" in raw and "i18n-ignore-next" not in raw
        ctx = raw.strip()[:160]
        for start, inner in lits:
            inner_clean = strip_interpolation(inner)
            if not is_prose(inner_clean):
                continue
            if line_suppress:
                out["allowlist"].append(
                    {"file": rel, "line": ln, "text": inner, "ctx": ctx, "supp": True}
                )
                continue
            # `inner` is the raw text between the quotes, so the closing quote
            # is at start + 1 + len(inner); the suffix begins right after it.
            suffix = raw[start + len(inner) + 2:]
            bucket = classify(lang, raw[:start], inner_clean, raw, suffix)
            out[bucket].append({"file": rel, "line": ln, "text": inner, "ctx": ctx})
    return out
|
|
|
|
def collect():
    """Walk every configured source tree and merge the per-file scan results.

    Returns:
        A dict with keys ``"localized"``, ``"allowlist"`` and ``"gap"``, each
        holding the concatenated records returned by ``scan_file``.
    """
    files = []
    for d in IOS_DIRS + KT_DIRS:
        base = os.path.join(ROOT, d)
        for dirpath, _, names in os.walk(base):
            for name in names:
                # The language is decided by file extension, not by which
                # tree the file was found in.
                if name.endswith(".swift"):
                    lang = "swift"
                elif name.endswith(".kt"):
                    lang = "kotlin"
                else:
                    continue
                files.append((os.path.join(dirpath, name), lang))

    res = {"localized": [], "allowlist": [], "gap": []}
    for path, lang in files:
        # Apply the skip rules to the repo-relative path only. Matching the
        # absolute path would let a checkout location such as /home/me/dev/...
        # or /tmp/build/... hit "/dev/" or "/build/" and skip every file,
        # making the gate pass without scanning anything.
        rel = os.path.relpath(path, ROOT).replace(os.sep, "/")
        probe = "/" + rel
        if any(s in probe for s in SKIP_PATH_SUBSTR) or SKIP_PATH_REGEX.search(rel):
            continue
        scanned = scan_file(path, lang)
        for bucket in res:
            res[bucket].extend(scanned[bucket])
    return res
|
|
|
|
def main():
    """Run the audit, print the report and exit with the CI status.

    Flags:
        --json OUT    also write the full result dict to OUT as JSON.
        --allowlist   print up to 60 non-suppressed allowlist entries.
        --all         accepted for command-line compatibility; not read here.

    Exits with status 0 when the GAP bucket is empty, otherwise 1.
    """
    ap = argparse.ArgumentParser()
    ap.add_argument("--json")
    ap.add_argument("--all", action="store_true")
    ap.add_argument("--allowlist", action="store_true")
    args = ap.parse_args()

    res = collect()
    g = res["gap"]
    suppressed = sum(1 for x in res["allowlist"] if x.get("supp"))

    print("\n=== i18n audit ===")
    print(f"LOCALIZED : {len(res['localized'])}")
    print(f"ALLOWLIST : {len(res['allowlist'])} (incl. {suppressed} inline-suppressed)")
    print(f"GAP : {len(g)}")

    by_file = {}
    for r in g:
        by_file.setdefault(r["file"], []).append(r)
    print(f"\n--- GAPS in {len(by_file)} files ---")
    for f in sorted(by_file):
        print(f"\n{f} ({len(by_file[f])})")
        for r in by_file[f]:
            print(f" {r['line']:>4}: \"{r['text']}\"")

    if args.json:
        # ensure_ascii=False writes non-ASCII source text as-is, so the file
        # must be opened as UTF-8 rather than the platform default encoding;
        # the context manager guarantees the handle is flushed and closed.
        with open(args.json, "w", encoding="utf-8") as fh:
            json.dump(res, fh, ensure_ascii=False, indent=2)
        print(f"\nwrote {args.json}")

    if args.allowlist:
        print("\n--- ALLOWLIST (non-suppressed) sample ---")
        for r in [x for x in res["allowlist"] if not x.get("supp")][:60]:
            print(f" {r['file']}:{r['line']}: \"{r['text']}\"")

    sys.exit(0 if not g else 1)


if __name__ == "__main__":
    main()