jlin53882 · jlin53882 · Mar 23, 2026 · Mar 23, 2026 · Mar 23, 2026 · Mar 23, 2026
diff --git a/translation_tool/checkers/color_char_checker.py b/translation_tool/checkers/color_char_checker.py
@@ -0,0 +1,118 @@
+"""translation_tool/checkers/color_char_checker.py 模組。
+
+用途：檢查翻譯檔案中的非法顏色字元（& 後接非法的 Minecraft 顏色代碼字元）。
+維護注意：本檔案的函式 docstring 用於維護說明，不代表行為變更。
+"""
+
+import json
+import os
+import re
+from dataclasses import dataclass
+from typing import Any, Generator
+
+# Core rule: '&' may only be followed by a-v (so not w-z), 0-9, whitespace,
+# a backslash, or '#'.
+# The pattern captures the single character after '&' when it falls outside
+# that set. No flags are passed, so the match is case-sensitive and an
+# uppercase letter after '&' is captured as well.
+COLOR_PATTERN = re.compile(r"&([^a-v0-9\s\\#])")
+
+
+@dataclass
+class ColorCharError:
+    """One illegal color-code occurrence found in a checked string."""
+
+    file_path: str  # file the value came from; check_color_chars leaves it ""
+    key: str  # key of the offending value; check_color_chars leaves it ""
+    value: str  # the full string that was checked
+    illegal_char: str  # the character captured right after '&'
+    position: int  # index in value where the match (the '&') starts
+    message: str  # human-readable description of the problem
+
+
+def check_color_chars(value: str) -> list[ColorCharError]:
+    """Find every illegal color-code sequence in a single string.
+
+    Args:
+        value: The string to check.
+
+    Returns:
+        One ColorCharError per COLOR_PATTERN match, in order of appearance.
+        The list is empty when nothing is wrong (never None), so callers can
+        iterate the result without a None check. file_path and key are left
+        as "" for the caller to fill in.
+    """
+    errors: list[ColorCharError] = []
+    for match in COLOR_PATTERN.finditer(value):
+        illegal_char = match.group(1)
+        pos = match.start()  # index of the '&', not of the illegal character
+        errors.append(
+            ColorCharError(
+                file_path="",
+                key="",
+                value=value,
+                illegal_char=illegal_char,
+                position=pos,
+                message=f"在位置 {pos} 發現非法顏色字元 '&{illegal_char}'，"
+                f"& 後只能接 a-v（不含 w）、0-9、空格、\\、#。",
+            )
+        )
+    return errors
+
+
+def _check_value(
+    file_path: str,
+    key: str,
+    value: Any,
+) -> Generator[ColorCharError, None, None]:
+    """Recursively check a parsed JSON value and yield each finding.
+
+    Args:
+        file_path: Path recorded on every yielded error.
+        key: Key path of ``value`` within the file. Nested dict keys are
+            joined with "." and list items are suffixed with "[index]".
+        value: The value to check. Strings are checked, dicts and lists are
+            walked recursively, and any other type is ignored.
+
+    Yields:
+        ColorCharError instances with file_path and key filled in.
+    """
+    if isinstance(value, str):
+        # "or ()" tolerates a None result as well as an empty list.
+        for err in check_color_chars(value) or ():
+            # check_color_chars leaves file_path/key empty; fill them in here.
+            yield ColorCharError(
+                file_path=err.file_path or file_path,
+                key=err.key or key,
+                value=err.value,
+                illegal_char=err.illegal_char,
+                position=err.position,
+                message=err.message,
+            )
+    elif isinstance(value, dict):
+        for k, v in value.items():
+            # Prefix with the parent key so a nested finding reports its
+            # full path instead of only the innermost key.
+            nested_key = f"{key}.{k}" if key else k
+            yield from _check_value(file_path, nested_key, v)
+    elif isinstance(value, list):
+        for i, item in enumerate(value):
+            yield from _check_value(file_path, f"{key}[{i}]", item)
+
+
+def check_json_file(file_path: str) -> Generator[ColorCharError, None, None]:
+    """Load a JSON file and check every string value it contains.
+
+    Args:
+        file_path: Path of the JSON file to read (decoded as UTF-8).
+
+    Yields:
+        Each ColorCharError found. Nothing is yielded when the file cannot
+        be read or parsed, or when its top-level value is not an object.
+    """
+    try:
+        with open(file_path, encoding="utf-8") as handle:
+            document = json.load(handle)
+    except Exception:
+        # Best effort: a file that fails to load must not stop the
+        # remaining files from being checked.
+        return
+
+    if not isinstance(document, dict):
+        return
+    for top_key, top_value in document.items():
+        yield from _check_value(file_path, top_key, top_value)
+
+
+def check_directory(dir_path: str) -> Generator[ColorCharError, None, None]:
+    """Walk a directory tree and check every ``.json`` file in it.
+
+    Args:
+        dir_path: Root directory to walk.
+
+    Yields:
+        Each ColorCharError reported by check_json_file, in walk order.
+    """
+    for parent, _subdirs, names in os.walk(dir_path):
+        json_names = (name for name in names if name.endswith(".json"))
+        for name in json_names:
+            yield from check_json_file(os.path.join(parent, name))
diff --git a/translation_tool/core/kubejs_translator_clean.py b/translation_tool/core/kubejs_translator_clean.py
@@ -203,6 +203,37 @@ def clean_kubejs_from_raw_impl(
             else:
                 pending_en = en
 
+            # ── 雙軌去重（reverse_index dedup）───────────────────────────────
+            # 目的：若某英文文字（value）已出現在 final/zh_tw.json（不同 key），
+            #       表示該英文原文已有翻譯，不需要再送 pending。
+            # 建立 reverse_index：{英文文字: [key1, key2, ...]}
+            if pending_en and final_root_p.exists():
+                # 從 final/zh_tw.json 建立 final_tw_lookup（key → 原文）
+                final_tw_lookup: dict[str, str] = {}
+                for tw_file in final_root_p.rglob("zh_tw.json"):
+                    tw_data = read_json_dict_fn(tw_file)
+                    if tw_data:
+                        final_tw_lookup.update(tw_data)
+
+                if final_tw_lookup:
+                    # 建立 reverse_index（英文文字 → 對應 key 列表）
+                    reverse_index: dict[str, list[str]] = {}
+                    for k, v in final_tw_lookup.items():
+                        if is_filled_text_impl(v):
+                            reverse_index.setdefault(v, []).append(k)
+
+                    # 過濾 pending_en：跳過那些「英文文字已存在於 final」的 key
+                    pending_en = {
+                        k: v
+                        for k, v in pending_en.items()
+                        if not (
+                            is_filled_text_impl(v)
+                            and v in reverse_index
+                            and k != reverse_index[v][0]
+                        )
+                    }
+            # ── 雙軌去重 end ───────────────────────────────────────────────
+
             if pending_en:
                 dst_en = pending_root_p / rel_group / "en_us.json"
                 write_json_fn(dst_en, pending_en)