2 miesięcy temu · 1c542067c7
--- a/src/translator/__init__.py
+++ b/src/translator/__init__.py
@@ -9,6 +9,14 @@ from .engine import TranslationEngine
 
				 from .pipeline import TranslationPipeline
			
 
				 from .chapter_translator import ChapterTranslator
			
 
				 from .progress import ProgressReporter, ProgressCallback
			
 
				+from .term_injector import (
			
 
				+    TermInjector,
			
 
				+    TermValidator,
			
 
				+    TermStatistics,
			
 
				+    TermValidationResult,
			
 
				+    TermResult,
			
 
				+    TermUsageRecord,
			
 
				+)
			
 
				 
			
 
				 __all__ = [
			
 
				     "TranslationEngine",
			
@@ -16,4 +24,10 @@ __all__ = [
 
				     "ChapterTranslator",
			
 
				     "ProgressReporter",
			
 
				     "ProgressCallback",
			
 
				+    "TermInjector",
			
 
				+    "TermValidator",
			
 
				+    "TermStatistics",
			
 
				+    "TermValidationResult",
			
 
				+    "TermResult",
			
 
				+    "TermUsageRecord",
			
 
				 ]
			
--- a/src/translator/pipeline.py
+++ b/src/translator/pipeline.py
@@ -6,12 +6,13 @@ the translation engine with glossary preprocessing and post-processing.
 
				 """
			
 
				 
			
 
				 from dataclasses import dataclass
			
 
				-from typing import Dict, List, Optional, Tuple
			
 
				+from typing import Dict, List, Optional, Tuple, Any
			
 
				 
			
 
				 from ..glossary.models import Glossary, GlossaryEntry
			
 
				 from ..glossary.pipeline import GlossaryPipeline
			
 
				 from ..glossary.postprocessor import GlossaryPostprocessor
			
 
				 from .engine import TranslationEngine
			
 
				+from .term_injector import TermInjector, TermValidator, TermStatistics, TermValidationResult
			
 
				 
			
 
				 
			
 
				 @dataclass
			
@@ -25,6 +26,7 @@ class TranslationResult:
 
				         raw_translation: Raw translation before post-processing
			
 
				         terms_used: List of glossary terms used in preprocessing
			
 
				         placeholder_map: Mapping of placeholders to translations
			
 
				+        validation: Optional term validation result
			
 
				     """
			
 
				 
			
 
				     original: str
			
@@ -32,6 +34,7 @@ class TranslationResult:
 
				     raw_translation: str
			
 
				     terms_used: List[str]
			
 
				     placeholder_map: Dict[str, str]
			
 
				+    validation: Optional[TermValidationResult] = None
			
 
				 
			
 
				 
			
 
				 class TranslationPipeline:
			
@@ -40,8 +43,11 @@ class TranslationPipeline:
 
				 
			
 
				     This pipeline integrates:
			
 
				     1. Glossary preprocessing (term replacement with placeholders)
			
 
				-    2. Translation via m2m100
			
 
				-    3. Post-processing (placeholder restoration and cleanup)
			
 
				+    2. Term injection (generating prompts with terminology guidance)
			
 
				+    3. Translation via m2m100
			
 
				+    4. Post-processing (placeholder restoration and cleanup)
			
 
				+    5. Term validation (checking translation consistency)
			
 
				+    6. Statistics tracking (recording term usage)
			
 
				 
			
 
				     Example:
			
 
				         >>> glossary = Glossary()
			
@@ -57,7 +63,8 @@ class TranslationPipeline:
 
				         engine: TranslationEngine,
			
 
				         glossary: Optional[Glossary] = None,
			
 
				         src_lang: str = "zh",
			
 
				-        tgt_lang: str = "en"
			
 
				+        tgt_lang: str = "en",
			
 
				+        enable_validation: bool = True
			
 
				     ):
			
 
				         """
			
 
				         Initialize the translation pipeline.
			
@@ -67,6 +74,7 @@ class TranslationPipeline:
 
				             glossary: Optional glossary for terminology management
			
 
				             src_lang: Source language code
			
 
				             tgt_lang: Target language code
			
 
				+            enable_validation: Whether to enable term validation
			
 
				         """
			
 
				         self.engine = engine
			
 
				         self.glossary = glossary or Glossary()
			
@@ -74,6 +82,12 @@ class TranslationPipeline:
 
				         self.postprocessor = GlossaryPostprocessor()
			
 
				         self.src_lang = src_lang
			
 
				         self.tgt_lang = tgt_lang
			
 
				+        self.enable_validation = enable_validation
			
 
				+
			
 
				+        # Initialize term injection components
			
 
				+        self.term_injector = TermInjector(self.glossary, src_lang, tgt_lang)
			
 
				+        self.term_validator = TermValidator(self.glossary)
			
 
				+        self.statistics = TermStatistics()
			
 
				 
			
 
				     @property
			
 
				     def has_glossary(self) -> bool:
			
@@ -107,13 +121,37 @@ class TranslationPipeline:
 
				         # Step 3: Post-processing
			
 
				         final_translation = self.postprocessor.process(raw_translation, placeholder_map)
			
 
				 
			
 
				+        # Step 4: Term validation (if enabled)
			
 
				+        validation = None
			
 
				+        if self.enable_validation and terms_used:
			
 
				+            # Get the actual entries for validation
			
 
				+            entries = [self.glossary.get(term) for term in terms_used if self.glossary.get(term)]
			
 
				+            if entries:
			
 
				+                validation = self.term_validator.validate_translation(
			
 
				+                    source=text,
			
 
				+                    target=final_translation,
			
 
				+                    terms=entries
			
 
				+                )
			
 
				+
			
 
				+                # Record statistics for each term
			
 
				+                for entry in entries:
			
 
				+                    term_result = validation.term_results.get(entry.source)
			
 
				+                    if term_result:
			
 
				+                        self.statistics.record_usage(
			
 
				+                            term=entry.source,
			
 
				+                            expected=entry.target,
			
 
				+                            success=term_result.success,
			
 
				+                            context=term_result.context
			
 
				+                        )
			
 
				+
			
 
				         if return_details:
			
 
				             return TranslationResult(
			
 
				                 original=text,
			
 
				                 translated=final_translation,
			
 
				                 raw_translation=raw_translation,
			
 
				                 terms_used=terms_used,
			
 
				-                placeholder_map=placeholder_map
			
 
				+                placeholder_map=placeholder_map,
			
 
				+                validation=validation
			
 
				             )
			
 
				 
			
 
				         return final_translation
			
@@ -161,13 +199,40 @@ class TranslationPipeline:
 
				                 all_placeholder_maps[i]
			
 
				             )
			
 
				 
			
 
				+            # Validate and record statistics if enabled
			
 
				+            validation = None
			
 
				+            if self.enable_validation and all_terms_used[i]:
			
 
				+                entries = [
			
 
				+                    self.glossary.get(term)
			
 
				+                    for term in all_terms_used[i]
			
 
				+                    if self.glossary.get(term)
			
 
				+                ]
			
 
				+                if entries:
			
 
				+                    validation = self.term_validator.validate_translation(
			
 
				+                        source=texts[i],
			
 
				+                        target=final_translation,
			
 
				+                        terms=entries
			
 
				+                    )
			
 
				+
			
 
				+                    # Record statistics
			
 
				+                    for entry in entries:
			
 
				+                        term_result = validation.term_results.get(entry.source)
			
 
				+                        if term_result:
			
 
				+                            self.statistics.record_usage(
			
 
				+                                term=entry.source,
			
 
				+                                expected=entry.target,
			
 
				+                                success=term_result.success,
			
 
				+                                context=term_result.context
			
 
				+                            )
			
 
				+
			
 
				             if return_details:
			
 
				                 results.append(TranslationResult(
			
 
				                     original=texts[i],
			
 
				                     translated=final_translation,
			
 
				                     raw_translation=raw_translation,
			
 
				                     terms_used=all_terms_used[i],
			
 
				-                    placeholder_map=all_placeholder_maps[i]
			
 
				+                    placeholder_map=all_placeholder_maps[i],
			
 
				+                    validation=validation
			
 
				                 ))
			
 
				             else:
			
 
				                 results.append(final_translation)
			
@@ -183,6 +248,9 @@ class TranslationPipeline:
 
				         """
			
 
				         self.glossary = glossary
			
 
				         self.glossary_pipeline = GlossaryPipeline(glossary)
			
 
				+        # Update term injection components
			
 
				+        self.term_injector = TermInjector(glossary, self.src_lang, self.tgt_lang)
			
 
				+        self.term_validator = TermValidator(glossary)
			
 
				 
			
 
				     def add_term(self, entry: GlossaryEntry) -> None:
			
 
				         """
			
@@ -220,3 +288,65 @@ class TranslationPipeline:
 
				             Dictionary mapping term names to occurrence counts
			
 
				         """
			
 
				         return self.glossary_pipeline.get_statistics(text)
			
 
				+
			
 
				+    def get_term_statistics(self) -> Dict[str, Any]:
			
 
				+        """
			
 
				+        Get term translation statistics from the pipeline.
			
 
				+
			
 
				+        Returns:
			
 
				+            Dictionary containing statistics about term usage
			
 
				+        """
			
 
				+        return self.statistics.get_statistics()
			
 
				+
			
 
				+    def get_validation_report(self) -> str:
			
 
				+        """
			
 
				+        Generate a human-readable validation report.
			
 
				+
			
 
				+        Returns:
			
 
				+            Formatted report string
			
 
				+        """
			
 
				+        return self.statistics.generate_report()
			
 
				+
			
 
				+    def reset_statistics(self) -> None:
			
 
				+        """Reset all term usage statistics."""
			
 
				+        self.statistics.reset()
			
 
				+
			
 
				+    def get_term_injection_prompt(self, text: str) -> str:
			
 
				+        """
			
 
				+        Generate a term injection prompt for the given text.
			
 
				+
			
 
				+        This can be used with LLM-based translation engines
			
 
				+        that accept prompts for terminology guidance.
			
 
				+
			
 
				+        Args:
			
 
				+            text: The text to translate
			
 
				+
			
 
				+        Returns:
			
 
				+            A prompt string with terminology guidance
			
 
				+        """
			
 
				+        return self.term_injector.generate_prompt(text)
			
 
				+
			
 
				+    def validate_translation(
			
 
				+        self,
			
 
				+        source: str,
			
 
				+        target: str
			
 
				+    ) -> Optional[TermValidationResult]:
			
 
				+        """
			
 
				+        Validate a translation against the glossary.
			
 
				+
			
 
				+        Args:
			
 
				+            source: Original source text
			
 
				+            target: Translated text to validate
			
 
				+
			
 
				+        Returns:
			
 
				+            TermValidationResult or None if no terms found
			
 
				+        """
			
 
				+        entries = []
			
 
				+        for entry in self.glossary.get_all():
			
 
				+            if entry.source in source:
			
 
				+                entries.append(entry)
			
 
				+
			
 
				+        if not entries:
			
 
				+            return None
			
 
				+
			
 
				+        return self.term_validator.validate_translation(source, target, entries)
			
--- a/src/translator/term_injector.py
+++ b/src/translator/term_injector.py
@@ -0,0 +1,592 @@
 
				+"""
			
 
				+Term injection module for enhanced translation consistency.
			
 
				+
			
 
				+This module provides functionality for injecting terminology guidance
			
 
				+into the translation process, validating term consistency, and tracking
			
 
				+statistics about term usage.
			
 
				+"""
			
 
				+
			
 
				+import re
			
 
				+from dataclasses import dataclass, field
			
 
				+from typing import Dict, List, Optional, Any, Set
			
 
				+from collections import defaultdict
			
 
				+
			
 
				+from ..glossary.models import Glossary, GlossaryEntry, TermCategory
			
 
				+
			
 
				+
			
 
				+@dataclass
			
 
				+class TermValidationResult:
			
 
				+    """
			
 
				+    Result of validating term consistency in translation.
			
 
				+
			
 
				+    Attributes:
			
 
				+        is_valid: Whether all terms were translated consistently
			
 
				+        term_results: Dictionary mapping source terms to validation results
			
 
				+        success_rate: Percentage of terms that were successfully translated
			
 
				+        issues: List of issues found during validation
			
 
				+    """
			
 
				+
			
 
				+    is_valid: bool
			
 
				+    term_results: Dict[str, "TermResult"]
			
 
				+    success_rate: float
			
 
				+    issues: List[str] = field(default_factory=list)
			
 
				+
			
 
				+    @property
			
 
				+    def successful_terms(self) -> Set[str]:
			
 
				+        """Set of terms that were successfully translated."""
			
 
				+        return {term for term, result in self.term_results.items() if result.success}
			
 
				+
			
 
				+    @property
			
 
				+    def failed_terms(self) -> Set[str]:
			
 
				+        """Set of terms that failed validation."""
			
 
				+        return {term for term, result in self.term_results.items() if not result.success}
			
 
				+
			
 
				+
			
 
				+@dataclass
			
 
				+class TermResult:
			
 
				+    """
			
 
				+    Result for a single term validation.
			
 
				+
			
 
				+    Attributes:
			
 
				+        source: The source term
			
 
				+        expected: The expected translation
			
 
				+        found: Whether the expected translation was found
			
 
				+        success: Whether the validation passed
			
 
				+        context: Context about where/how the term was validated
			
 
				+    """
			
 
				+
			
 
				+    source: str
			
 
				+    expected: str
			
 
				+    found: bool
			
 
				+    success: bool
			
 
				+    context: str = ""
			
 
				+
			
 
				+
			
 
				+@dataclass
			
 
				+class TermUsageRecord:
			
 
				+    """
			
 
				+    A single record of term usage during translation.
			
 
				+
			
 
				+    Attributes:
			
 
				+        term: The source term
			
 
				+        expected: The expected translation
			
 
				+        success: Whether the term was correctly translated
			
 
				+        context: The text context where the term was used
			
 
				+    """
			
 
				+
			
 
				+    term: str
			
 
				+    expected: str
			
 
				+    success: bool
			
 
				+    context: str
			
 
				+
			
 
				+
			
 
				+class TermInjector:
			
 
				+    """
			
 
				+    Injects terminology guidance into the translation process.
			
 
				+
			
 
				+    This class generates prompts that include glossary information
			
 
				+    to guide translation models toward consistent terminology usage.
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, glossary: Glossary, src_lang: str = "zh", tgt_lang: str = "en"):
			
 
				+        """
			
 
				+        Initialize the term injector.
			
 
				+
			
 
				+        Args:
			
 
				+            glossary: The glossary containing terminology
			
 
				+            src_lang: Source language code
			
 
				+            tgt_lang: Target language code
			
 
				+        """
			
 
				+        self.glossary = glossary
			
 
				+        self.src_lang = src_lang
			
 
				+        self.tgt_lang = tgt_lang
			
 
				+
			
 
				+    def generate_prompt(
			
 
				+        self,
			
 
				+        source_text: str,
			
 
				+        include_examples: bool = True,
			
 
				+        max_examples: int = 5
			
 
				+    ) -> str:
			
 
				+        """
			
 
				+        Generate a translation prompt with terminology guidance.
			
 
				+
			
 
				+        This creates a prompt that can be used with LLM-based translation
			
 
				+        systems to ensure consistent terminology usage.
			
 
				+
			
 
				+        Args:
			
 
				+            source_text: The text to translate
			
 
				+            include_examples: Whether to include few-shot examples
			
 
				+            max_examples: Maximum number of examples to include
			
 
				+
			
 
				+        Returns:
			
 
				+            A prompt string with terminology guidance
			
 
				+        """
			
 
				+        # Get relevant terms for the source text
			
 
				+        relevant_terms = self._get_relevant_terms(source_text)
			
 
				+
			
 
				+        if not relevant_terms:
			
 
				+            # No terms to inject, return just the source text
			
 
				+            return source_text
			
 
				+
			
 
				+        # Build the prompt
			
 
				+        prompt_parts = []
			
 
				+
			
 
				+        # Add system instruction
			
 
				+        prompt_parts.append(self._build_system_instruction())
			
 
				+
			
 
				+        # Add terminology table
			
 
				+        prompt_parts.append(self._build_terminology_table(relevant_terms))
			
 
				+
			
 
				+        # Add few-shot examples if requested
			
 
				+        if include_examples:
			
 
				+            examples = self._generate_examples(relevant_terms[:max_examples])
			
 
				+            prompt_parts.append(examples)
			
 
				+
			
 
				+        # Add the text to translate
			
 
				+        prompt_parts.append(f"\nText to translate:\n{source_text}")
			
 
				+
			
 
				+        return "\n".join(prompt_parts)
			
 
				+
			
 
				+    def _get_relevant_terms(self, source_text: str) -> List[GlossaryEntry]:
			
 
				+        """
			
 
				+        Get glossary terms that appear in the source text.
			
 
				+
			
 
				+        Args:
			
 
				+            source_text: The text to check for terms
			
 
				+
			
 
				+        Returns:
			
 
				+            List of relevant GlossaryEntry objects
			
 
				+        """
			
 
				+        relevant = []
			
 
				+        for entry in self.glossary.get_all():
			
 
				+            if entry.source in source_text:
			
 
				+                relevant.append(entry)
			
 
				+
			
 
				+        # Sort by length (longest first) for consistency
			
 
				+        relevant.sort(key=lambda e: len(e.source), reverse=True)
			
 
				+        return relevant
			
 
				+
			
 
				+    def _build_system_instruction(self) -> str:
			
 
				+        """
			
 
				+        Build the system instruction for the prompt.
			
 
				+
			
 
				+        Returns:
			
 
				+            System instruction string
			
 
				+        """
			
 
				+        lang_names = {
			
 
				+            "zh": "Chinese",
			
 
				+            "en": "English",
			
 
				+            "ja": "Japanese",
			
 
				+            "ko": "Korean",
			
 
				+        }
			
 
				+        src_name = lang_names.get(self.src_lang, self.src_lang)
			
 
				+        tgt_name = lang_names.get(self.tgt_lang, self.tgt_lang)
			
 
				+
			
 
				+        return (
			
 
				+            f"You are translating from {src_name} to {tgt_name}. "
			
 
				+            "Use the terminology table below to ensure consistent translation "
			
 
				+            "of specific terms. Always translate the terms in the table exactly "
			
 
				+            "as specified, even if different translations might be possible."
			
 
				+        )
			
 
				+
			
 
				+    def _build_terminology_table(self, terms: List[GlossaryEntry]) -> str:
			
 
				+        """
			
 
				+        Build a terminology table for the prompt.
			
 
				+
			
 
				+        Args:
			
 
				+            terms: List of terms to include
			
 
				+
			
 
				+        Returns:
			
 
				+            Formatted terminology table string
			
 
				+        """
			
 
				+        lines = ["\nTerminology Table:"]
			
 
				+        lines.append("-" * 50)
			
 
				+
			
 
				+        # Group by category for better organization
			
 
				+        by_category: Dict[TermCategory, List[GlossaryEntry]] = defaultdict(list)
			
 
				+        for term in terms:
			
 
				+            by_category[term.category].append(term)
			
 
				+
			
 
				+        for category in TermCategory:
			
 
				+            if category not in by_category:
			
 
				+                continue
			
 
				+            lines.append(f"\n{category.value.title()}:")
			
 
				+            for entry in by_category[category]:
			
 
				+                context_note = f" ({entry.context})" if entry.context else ""
			
 
				+                lines.append(f"  - {entry.source} → {entry.target}{context_note}")
			
 
				+
			
 
				+        lines.append("-" * 50)
			
 
				+        return "\n".join(lines)
			
 
				+
			
 
				+    def _generate_examples(self, terms: List[GlossaryEntry]) -> str:
			
 
				+        """
			
 
				+        Generate few-shot examples for the prompt.
			
 
				+
			
 
				+        Args:
			
 
				+            terms: List of terms to create examples for
			
 
				+
			
 
				+        Returns:
			
 
				+            Formatted examples string
			
 
				+        """
			
 
				+        if not terms:
			
 
				+            return ""
			
 
				+
			
 
				+        lines = ["\nExamples:"]
			
 
				+
			
 
				+        # Create examples using the terms
			
 
				+        for i, entry in enumerate(terms[:3], 1):
			
 
				+            if entry.category == TermCategory.CHARACTER:
			
 
				+                example_src = f"{entry.source}使用了技能"
			
 
				+                example_tgt = f"{entry.target} used a skill"
			
 
				+            elif entry.category == TermCategory.SKILL:
			
 
				+                example_src = f"他施展了{entry.source}"
			
 
				+                example_tgt = f"He cast {entry.target}"
			
 
				+            elif entry.category == TermCategory.LOCATION:
			
 
				+                example_src = f"他来到了{entry.source}"
			
 
				+                example_tgt = f"He arrived at {entry.target}"
			
 
				+            elif entry.category == TermCategory.ITEM:
			
 
				+                example_src = f"他拿起了{entry.source}"
			
 
				+                example_tgt = f"He picked up {entry.target}"
			
 
				+            else:
			
 
				+                example_src = f"这是一个{entry.source}"
			
 
				+                example_tgt = f"This is {entry.target}"
			
 
				+
			
 
				+            lines.append(f"  {i}. {example_src}")
			
 
				+            lines.append(f"     → {example_tgt}")
			
 
				+
			
 
				+        return "\n".join(lines)
			
 
				+
			
 
				+    def inject_terms(self, source_text: str, terms: List[str]) -> str:
			
 
				+        """
			
 
				+        Inject term markers into source text for processing.
			
 
				+
			
 
				+        This is a fallback method for models that don't accept prompts.
			
 
				+        It wraps terms in special markers to help with post-processing.
			
 
				+
			
 
				+        Args:
			
 
				+            source_text: The source text
			
 
				+            terms: List of terms to mark
			
 
				+
			
 
				+        Returns:
			
 
				+            Text with terms wrapped in markers
			
 
				+        """
			
 
				+        result = source_text
			
 
				+        # Sort by length (longest first) for correct replacement
			
 
				+        terms_sorted = sorted(terms, key=len, reverse=True)
			
 
				+
			
 
				+        for term in terms_sorted:
			
 
				+            # Create a marker for the term
			
 
				+            marker = f"[TERM:{term}]"
			
 
				+            result = result.replace(term, marker)
			
 
				+
			
 
				+        return result
			
 
				+
			
 
				+
			
 
				+class TermValidator:
			
 
				+    """
			
 
				+    Validates term consistency in translations.
			
 
				+
			
 
				+    This class checks whether the translated text contains the expected
			
 
				+    translations for all terms from the glossary.
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, glossary: Glossary):
			
 
				+        """
			
 
				+        Initialize the term validator.
			
 
				+
			
 
				+        Args:
			
 
				+            glossary: The glossary containing expected translations
			
 
				+        """
			
 
				+        self.glossary = glossary
			
 
				+
			
 
				+    def validate_translation(
			
 
				+        self,
			
 
				+        source: str,
			
 
				+        target: str,
			
 
				+        terms: Optional[List[GlossaryEntry]] = None
			
 
				+    ) -> TermValidationResult:
			
 
				+        """
			
 
				+        Validate that translation contains expected term translations.
			
 
				+
			
 
				+        Args:
			
 
				+            source: Original source text
			
 
				+            target: Translated text to validate
			
 
				+            terms: Optional list of specific terms to validate (default: all in glossary)
			
 
				+
			
 
				+        Returns:
			
 
				+            TermValidationResult with validation details
			
 
				+        """
			
 
				+        if terms is None:
			
 
				+            # Find terms that appear in source text
			
 
				+            terms = self._get_source_terms(source)
			
 
				+
			
 
				+        term_results: Dict[str, TermResult] = {}
			
 
				+        issues: List[str] = []
			
 
				+
			
 
				+        for entry in terms:
			
 
				+            result = self._check_term_consistency(source, target, entry)
			
 
				+            term_results[entry.source] = result
			
 
				+
			
 
				+            if not result.success:
			
 
				+                issues.append(
			
 
				+                    f"Term '{entry.source}' not translated as expected. "
			
 
				+                    f"Expected: '{entry.target}', Context: {result.context}"
			
 
				+                )
			
 
				+
			
 
				+        # Calculate success rate
			
 
				+        if term_results:
			
 
				+            successful = sum(1 for r in term_results.values() if r.success)
			
 
				+            success_rate = (successful / len(term_results)) * 100
			
 
				+        else:
			
 
				+            success_rate = 100.0
			
 
				+
			
 
				+        is_valid = all(r.success for r in term_results.values())
			
 
				+
			
 
				+        return TermValidationResult(
			
 
				+            is_valid=is_valid,
			
 
				+            term_results=term_results,
			
 
				+            success_rate=success_rate,
			
 
				+            issues=issues
			
 
				+        )
			
 
				+
			
 
				+    def _get_source_terms(self, source: str) -> List[GlossaryEntry]:
			
 
				+        """
			
 
				+        Get glossary entries that appear in source text.
			
 
				+
			
 
				+        Args:
			
 
				+            source: Source text to check
			
 
				+
			
 
				+        Returns:
			
 
				+            List of relevant GlossaryEntry objects
			
 
				+        """
			
 
				+        terms = []
			
 
				+        for entry in self.glossary.get_all():
			
 
				+            if entry.source in source:
			
 
				+                terms.append(entry)
			
 
				+        return terms
			
 
				+
			
 
				+    def _check_term_consistency(
			
 
				+        self,
			
 
				+        source: str,
			
 
				+        target: str,
			
 
				+        entry: GlossaryEntry
			
 
				+    ) -> TermResult:
			
 
				+        """
			
 
				+        Check if a single term was translated consistently.
			
 
				+
			
 
				+        Args:
			
 
				+            source: Source text
			
 
				+            target: Target translation
			
 
				+            entry: The glossary entry to check
			
 
				+
			
 
				+        Returns:
			
 
				+            TermResult with validation details
			
 
				+        """
			
 
				+        # Check if the expected translation appears in target
			
 
				+        found = entry.target in target
			
 
				+
			
 
				+        # Additional check: count occurrences
			
 
				+        source_count = source.count(entry.source)
			
 
				+        target_count = target.count(entry.target)
			
 
				+
			
 
				+        # Success if found and counts match approximately
			
 
				+        # (allow some flexibility for word order changes)
			
 
				+        success = found and target_count >= source_count * 0.8
			
 
				+
			
 
				+        context = f"source_count={source_count}, target_count={target_count}"
			
 
				+
			
 
				+        return TermResult(
			
 
				+            source=entry.source,
			
 
				+            expected=entry.target,
			
 
				+            found=found,
			
 
				+            success=success,
			
 
				+            context=context
			
 
				+        )
			
 
				+
			
 
				+
			
 
				+class TermStatistics:
			
 
				+    """
			
 
				+    Tracks and reports statistics about term usage during translation.
			
 
				+
			
 
				+    This class records term usage, success/failure rates, and provides
			
 
				+    detailed statistics for reporting.
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self):
			
 
				+        """Initialize an empty statistics tracker."""
			
 
				+        self._records: List[TermUsageRecord] = []
			
 
				+        self._term_counts: Dict[str, int] = defaultdict(int)
			
 
				+        self._term_successes: Dict[str, int] = defaultdict(int)
			
 
				+
			
 
				+    def record_usage(
			
 
				+        self,
			
 
				+        term: str,
			
 
				+        expected: str,
			
 
				+        success: bool,
			
 
				+        context: str = ""
			
 
				+    ) -> None:
			
 
				+        """
			
 
				+        Record a term usage event.
			
 
				+
			
 
				+        Args:
			
 
				+            term: The source term used
			
 
				+            expected: The expected translation
			
 
				+            success: Whether the term was correctly translated
			
 
				+            context: Optional context information
			
 
				+        """
			
 
				+        record = TermUsageRecord(
			
 
				+            term=term,
			
 
				+            expected=expected,
			
 
				+            success=success,
			
 
				+            context=context
			
 
				+        )
			
 
				+        self._records.append(record)
			
 
				+        self._term_counts[term] += 1
			
 
				+        if success:
			
 
				+            self._term_successes[term] += 1
			
 
				+
			
 
				+    def get_statistics(self) -> Dict[str, Any]:
			
 
				+        """
			
 
				+        Get comprehensive statistics about term usage.
			
 
				+
			
 
				+        Returns:
			
 
				+            Dictionary containing statistics:
			
 
				+            - total_usages: Total number of term usage records
			
 
				+            - unique_terms: Number of unique terms used
			
 
				+            - total_successes: Total number of successful translations
			
 
				+            - total_failures: Total number of failed translations
			
 
				+            - overall_success_rate: Overall success rate percentage
			
 
				+            - term_breakdown: Per-term statistics
			
 
				+        """
			
 
				+        total_usages = len(self._records)
			
 
				+        unique_terms = len(self._term_counts)
			
 
				+        total_successes = sum(self._term_successes.values())
			
 
				+        total_failures = total_usages - total_successes
			
 
				+
			
 
				+        overall_rate = (total_successes / total_usages * 100) if total_usages > 0 else 100.0
			
 
				+
			
 
				+        term_breakdown: Dict[str, Dict[str, Any]] = {}
			
 
				+        for term in self._term_counts:
			
 
				+            count = self._term_counts[term]
			
 
				+            successes = self._term_successes[term]
			
 
				+            term_breakdown[term] = {
			
 
				+                "total_usages": count,
			
 
				+                "successes": successes,
			
 
				+                "failures": count - successes,
			
 
				+                "success_rate": (successes / count * 100) if count > 0 else 0
			
 
				+            }
			
 
				+
			
 
				+        return {
			
 
				+            "total_usages": total_usages,
			
 
				+            "unique_terms": unique_terms,
			
 
				+            "total_successes": total_successes,
			
 
				+            "total_failures": total_failures,
			
 
				+            "overall_success_rate": round(overall_rate, 2),
			
 
				+            "term_breakdown": term_breakdown
			
 
				+        }
			
 
				+
			
 
				+    def get_term_statistics(self, term: str) -> Optional[Dict[str, Any]]:
			
 
				+        """
			
 
				+        Get statistics for a specific term.
			
 
				+
			
 
				+        Args:
			
 
				+            term: The term to get statistics for
			
 
				+
			
 
				+        Returns:
			
 
				+            Dictionary with term statistics or None if term not found
			
 
				+        """
			
 
				+        if term not in self._term_counts:
			
 
				+            return None
			
 
				+
			
 
				+        count = self._term_counts[term]
			
 
				+        successes = self._term_successes[term]
			
 
				+
			
 
				+        return {
			
 
				+            "term": term,
			
 
				+            "total_usages": count,
			
 
				+            "successes": successes,
			
 
				+            "failures": count - successes,
			
 
				+            "success_rate": (successes / count * 100) if count > 0 else 0
			
 
				+        }
			
 
				+
			
 
				+    def get_failed_terms(self) -> List[str]:
			
 
				+        """
			
 
				+        Get list of terms that had at least one failure.
			
 
				+
			
 
				+        Returns:
			
 
				+            List of terms with failures
			
 
				+        """
			
 
				+        failed = []
			
 
				+        for term, count in self._term_counts.items():
			
 
				+            successes = self._term_successes.get(term, 0)
			
 
				+            if successes < count:
			
 
				+                failed.append(term)
			
 
				+        return failed
			
 
				+
			
 
				+    def get_records(self) -> List[TermUsageRecord]:
			
 
				+        """
			
 
				+        Get all recorded usage records.
			
 
				+
			
 
				+        Returns:
			
 
				+            List of all TermUsageRecord objects
			
 
				+        """
			
 
				+        return list(self._records)
			
 
				+
			
 
				+    def reset(self) -> None:
			
 
				+        """Reset all statistics."""
			
 
				+        self._records.clear()
			
 
				+        self._term_counts.clear()
			
 
				+        self._term_successes.clear()
			
 
				+
			
 
				+    def merge(self, other: "TermStatistics") -> None:
			
 
				+        """
			
 
				+        Merge statistics from another TermStatistics instance.
			
 
				+
			
 
				+        Args:
			
 
				+            other: Another TermStatistics instance to merge from
			
 
				+        """
			
 
				+        for record in other._records:
			
 
				+            self.record_usage(
			
 
				+                term=record.term,
			
 
				+                expected=record.expected,
			
 
				+                success=record.success,
			
 
				+                context=record.context
			
 
				+            )
			
 
				+
			
 
				+    def __len__(self) -> int:
			
 
				+        """Return the number of recorded usage events."""
			
 
				+        return len(self._records)
			
 
				+
			
 
				+    def generate_report(self) -> str:
			
 
				+        """
			
 
				+        Generate a human-readable statistics report.
			
 
				+
			
 
				+        Returns:
			
 
				+            Formatted report string
			
 
				+        """
			
 
				+        stats = self.get_statistics()
			
 
				+        lines = [
			
 
				+            "=== Term Translation Statistics ===",
			
 
				+            f"Total usages: {stats['total_usages']}",
			
 
				+            f"Unique terms: {stats['unique_terms']}",
			
 
				+            f"Total successes: {stats['total_successes']}",
			
 
				+            f"Total failures: {stats['total_failures']}",
			
 
				+            f"Overall success rate: {stats['overall_success_rate']}%",
			
 
				+            "",
			
 
				+            "Term Breakdown:"
			
 
				+        ]
			
 
				+
			
 
				+        for term, term_stats in sorted(stats['term_breakdown'].items()):
			
 
				+            lines.append(
			
 
				+                f"  {term}: {term_stats['successes']}/{term_stats['total_usages']} "
			
 
				+                f"({term_stats['success_rate']:.1f}%)"
			
 
				+            )
			
 
				+
			
 
				+        if stats['total_failures'] > 0:
			
 
				+            lines.append("")
			
 
				+            lines.append("Failed terms:")
			
 
				+            for term in self.get_failed_terms():
			
 
				+                term_stat = stats['term_breakdown'][term]
			
 
				+                lines.append(f"  - {term}: {term_stat['failures']} failures")
			
 
				+
			
 
				+        return "\n".join(lines)
			
--- a/tests/translator/__init__.py
+++ b/tests/translator/__init__.py
@@ -0,0 +1 @@
 
				+"""Tests for the translator module."""
			
--- a/tests/translator/test_term_injector.py
+++ b/tests/translator/test_term_injector.py
@@ -0,0 +1,510 @@
 
				+"""
			
 
				+Unit tests for the term injection module.
			
 
				+
			
 
				+Tests cover term injection, validation, and statistics tracking.
			
 
				+"""
			
 
				+
			
 
				+import sys
			
 
				+from unittest.mock import Mock
			
 
				+
			
 
				+# Mock torch and transformers before importing
			
 
				+sys_mock = Mock()
			
 
				+sys.modules["torch"] = sys_mock
			
 
				+sys.modules["transformers"] = sys_mock
			
 
				+
			
 
				+import pytest
			
 
				+
			
 
				+from src.glossary.models import Glossary, GlossaryEntry, TermCategory
			
 
				+from src.translator.term_injector import (
			
 
				+    TermInjector,
			
 
				+    TermValidator,
			
 
				+    TermStatistics,
			
 
				+    TermValidationResult,
			
 
				+    TermResult,
			
 
				+    TermUsageRecord,
			
 
				+)
			
 
				+
			
 
				+
			
 
				+class TestTermInjector:
			
 
				+    """Test cases for TermInjector class."""
			
 
				+
			
 
				+    def test_init(self):
			
 
				+        """Test TermInjector initialization."""
			
 
				+        glossary = Glossary()
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+
			
 
				+        assert injector.glossary == glossary
			
 
				+        assert injector.src_lang == "zh"
			
 
				+        assert injector.tgt_lang == "en"
			
 
				+
			
 
				+    def test_generate_prompt_with_terms(self):
			
 
				+        """Test prompt generation with glossary terms."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER, "Protagonist"))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        prompt = injector.generate_prompt("林风释放了火球术")
			
 
				+
			
 
				+        # Check that prompt contains key elements
			
 
				+        assert "Chinese" in prompt or "English" in prompt
			
 
				+        assert "林风" in prompt
			
 
				+        assert "Lin Feng" in prompt
			
 
				+        assert "火球术" in prompt
			
 
				+        assert "Fireball" in prompt
			
 
				+        assert "character" in prompt.lower()
			
 
				+        assert "skill" in prompt.lower()
			
 
				+
			
 
				+    def test_generate_prompt_without_examples(self):
			
 
				+        """Test prompt generation without few-shot examples."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        prompt = injector.generate_prompt("林风来了", include_examples=False)
			
 
				+
			
 
				+        assert "林风" in prompt
			
 
				+        assert "Lin Feng" in prompt
			
 
				+        assert "Examples:" not in prompt
			
 
				+
			
 
				+    def test_generate_prompt_empty_glossary(self):
			
 
				+        """Test prompt generation with empty glossary."""
			
 
				+        glossary = Glossary()
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        prompt = injector.generate_prompt("测试文本")
			
 
				+
			
 
				+        # Should just return the source text
			
 
				+        assert prompt == "测试文本"
			
 
				+
			
 
				+    def test_generate_prompt_max_examples(self):
			
 
				+        """Test prompt generation with limited examples."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+        glossary.add(GlossaryEntry("青云宗", "Qingyun Sect", TermCategory.ORGANIZATION))
			
 
				+        glossary.add(GlossaryEntry("龙剑", "Dragon Sword", TermCategory.ITEM))
			
 
				+
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        prompt = injector.generate_prompt("林风使用龙剑", max_examples=2)
			
 
				+
			
 
				+        # Should limit examples
			
 
				+        assert "Examples:" in prompt
			
 
				+
			
 
				+    def test_inject_terms(self):
			
 
				+        """Test term injection into source text."""
			
 
				+        glossary = Glossary()
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+
			
 
				+        result = injector.inject_terms("林风释放了火球术", ["林风", "火球术"])
			
 
				+
			
 
				+        assert "[TERM:林风]" in result
			
 
				+        assert "[TERM:火球术]" in result
			
 
				+
			
 
				+    def test_get_relevant_terms(self):
			
 
				+        """Test getting relevant terms for source text."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+        glossary.add(GlossaryEntry("青云宗", "Qingyun Sect", TermCategory.ORGANIZATION))
			
 
				+
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        relevant = injector._get_relevant_terms("林风释放了火球术")
			
 
				+
			
 
				+        # Should find two terms
			
 
				+        assert len(relevant) == 2
			
 
				+        sources = [t.source for t in relevant]
			
 
				+        assert "林风" in sources
			
 
				+        assert "火球术" in sources
			
 
				+        assert "青云宗" not in sources
			
 
				+
			
 
				+    def test_build_terminology_table(self):
			
 
				+        """Test terminology table building."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+
			
 
				+        injector = TermInjector(glossary, "zh", "en")
			
 
				+        terms = glossary.get_all()
			
 
				+        table = injector._build_terminology_table(terms)
			
 
				+
			
 
				+        assert "Terminology Table:" in table
			
 
				+        assert "林风" in table
			
 
				+        assert "Lin Feng" in table
			
 
				+        assert "Character:" in table
			
 
				+
			
 
				+
			
 
				+class TestTermValidator:
			
 
				+    """Test cases for TermValidator class."""
			
 
				+
			
 
				+    def test_init(self):
			
 
				+        """Test TermValidator initialization."""
			
 
				+        glossary = Glossary()
			
 
				+        validator = TermValidator(glossary)
			
 
				+
			
 
				+        assert validator.glossary == glossary
			
 
				+
			
 
				+    def test_validate_translation_success(self):
			
 
				+        """Test successful validation."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风来了",
			
 
				+            target="Lin Feng came"
			
 
				+        )
			
 
				+
			
 
				+        assert result.is_valid is True
			
 
				+        assert result.success_rate == 100.0
			
 
				+        assert len(result.term_results) == 1
			
 
				+        assert result.term_results["林风"].success is True
			
 
				+
			
 
				+    def test_validate_translation_failure(self):
			
 
				+        """Test validation with missing expected translation."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风来了",
			
 
				+            target="Lin came"  # Missing "Feng"
			
 
				+        )
			
 
				+
			
 
				+        assert result.is_valid is False
			
 
				+        assert result.success_rate < 100.0
			
 
				+        assert len(result.issues) > 0
			
 
				+
			
 
				+    def test_validate_translation_multiple_terms(self):
			
 
				+        """Test validation with multiple terms."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风释放了火球术",
			
 
				+            target="Lin Feng released Fireball"
			
 
				+        )
			
 
				+
			
 
				+        assert result.is_valid is True
			
 
				+        assert len(result.term_results) == 2
			
 
				+        assert result.term_results["林风"].success is True
			
 
				+        assert result.term_results["火球术"].success is True
			
 
				+
			
 
				+    def test_validate_translation_partial_match(self):
			
 
				+        """Test validation with partial term match."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        # Multiple occurrences but only one translated correctly
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风说，林风知道",
			
 
				+            target="Lin Feng said, Lin knows"  # Only one "Lin Feng"
			
 
				+        )
			
 
				+
			
 
				+        # Should detect the mismatch
			
 
				+        assert result.success_rate < 100
			
 
				+
			
 
				+    def test_validate_translation_empty_source(self):
			
 
				+        """Test validation with source text that has no terms."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="这是一个测试",  # No glossary terms
			
 
				+            target="This is a test"
			
 
				+        )
			
 
				+
			
 
				+        assert result.is_valid is True
			
 
				+        assert len(result.term_results) == 0
			
 
				+
			
 
				+    def test_check_term_consistency(self):
			
 
				+        """Test individual term consistency check."""
			
 
				+        glossary = Glossary()
			
 
				+        entry = GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER)
			
 
				+        glossary.add(entry)
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+
			
 
				+        # Successful case
			
 
				+        result = validator._check_term_consistency(
			
 
				+            source="林风来了",
			
 
				+            target="Lin Feng came",
			
 
				+            entry=entry
			
 
				+        )
			
 
				+        assert result.success is True
			
 
				+        assert result.source == "林风"
			
 
				+        assert result.expected == "Lin Feng"
			
 
				+
			
 
				+        # Failed case
			
 
				+        result = validator._check_term_consistency(
			
 
				+            source="林风来了",
			
 
				+            target="Lin came",
			
 
				+            entry=entry
			
 
				+        )
			
 
				+        assert result.success is False
			
 
				+
			
 
				+    def test_successful_terms_property(self):
			
 
				+        """Test successful_terms property."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风释放了火球术",
			
 
				+            target="Lin Feng released Fireball"
			
 
				+        )
			
 
				+
			
 
				+        assert "林风" in result.successful_terms
			
 
				+        assert "火球术" in result.successful_terms
			
 
				+
			
 
				+    def test_failed_terms_property(self):
			
 
				+        """Test failed_terms property."""
			
 
				+        glossary = Glossary()
			
 
				+        glossary.add(GlossaryEntry("林风", "Lin Feng", TermCategory.CHARACTER))
			
 
				+        glossary.add(GlossaryEntry("火球术", "Fireball", TermCategory.SKILL))
			
 
				+
			
 
				+        validator = TermValidator(glossary)
			
 
				+        result = validator.validate_translation(
			
 
				+            source="林风释放了火球术",
			
 
				+            target="Lin released Fireball"  # Missing "Feng"
			
 
				+        )
			
 
				+
			
 
				+        assert "林风" in result.failed_terms
			
 
				+        assert "火球术" not in result.failed_terms
			
 
				+
			
 
				+
			
 
				+class TestTermStatistics:
			
 
				+    """Test cases for TermStatistics class."""
			
 
				+
			
 
				+    def test_init(self):
			
 
				+        """Test TermStatistics initialization."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        assert len(stats) == 0
			
 
				+        assert stats.get_statistics()["total_usages"] == 0
			
 
				+
			
 
				+    def test_record_usage_success(self):
			
 
				+        """Test recording successful term usage."""
			
 
				+        stats = TermStatistics()
			
 
				+        stats.record_usage(
			
 
				+            term="林风",
			
 
				+            expected="Lin Feng",
			
 
				+            success=True,
			
 
				+            context="source_count=1, target_count=1"
			
 
				+        )
			
 
				+
			
 
				+        assert len(stats) == 1
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["total_usages"] == 1
			
 
				+        assert stat_dict["total_successes"] == 1
			
 
				+        assert stat_dict["total_failures"] == 0
			
 
				+
			
 
				+    def test_record_usage_failure(self):
			
 
				+        """Test recording failed term usage."""
			
 
				+        stats = TermStatistics()
			
 
				+        stats.record_usage(
			
 
				+            term="林风",
			
 
				+            expected="Lin Feng",
			
 
				+            success=False,
			
 
				+            context="source_count=1, target_count=0"
			
 
				+        )
			
 
				+
			
 
				+        assert len(stats) == 1
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["total_usages"] == 1
			
 
				+        assert stat_dict["total_successes"] == 0
			
 
				+        assert stat_dict["total_failures"] == 1
			
 
				+
			
 
				+    def test_record_multiple_usages(self):
			
 
				+        """Test recording multiple term usages."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", False)
			
 
				+
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["total_usages"] == 3
			
 
				+        assert stat_dict["total_successes"] == 2
			
 
				+        assert stat_dict["total_failures"] == 1
			
 
				+        assert stat_dict["unique_terms"] == 2
			
 
				+
			
 
				+    def test_get_term_statistics(self):
			
 
				+        """Test getting statistics for a specific term."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("林风", "Lin Feng", False)
			
 
				+
			
 
				+        term_stats = stats.get_term_statistics("林风")
			
 
				+        assert term_stats is not None
			
 
				+        assert term_stats["term"] == "林风"
			
 
				+        assert term_stats["total_usages"] == 2
			
 
				+        assert term_stats["successes"] == 1
			
 
				+        assert term_stats["failures"] == 1
			
 
				+        assert term_stats["success_rate"] == 50.0
			
 
				+
			
 
				+    def test_get_term_statistics_nonexistent(self):
			
 
				+        """Test getting statistics for a non-existent term."""
			
 
				+        stats = TermStatistics()
			
 
				+        term_stats = stats.get_term_statistics("nonexistent")
			
 
				+
			
 
				+        assert term_stats is None
			
 
				+
			
 
				+    def test_get_failed_terms(self):
			
 
				+        """Test getting list of failed terms."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", False)
			
 
				+        stats.record_usage("青云宗", "Qingyun Sect", False)
			
 
				+
			
 
				+        failed = stats.get_failed_terms()
			
 
				+        assert "林风" not in failed
			
 
				+        assert "火球术" in failed
			
 
				+        assert "青云宗" in failed
			
 
				+
			
 
				+    def test_reset(self):
			
 
				+        """Test resetting statistics."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", False)
			
 
				+
			
 
				+        assert len(stats) == 2
			
 
				+
			
 
				+        stats.reset()
			
 
				+
			
 
				+        assert len(stats) == 0
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["total_usages"] == 0
			
 
				+
			
 
				+    def test_merge(self):
			
 
				+        """Test merging statistics from another instance."""
			
 
				+        stats1 = TermStatistics()
			
 
				+        stats1.record_usage("林风", "Lin Feng", True)
			
 
				+
			
 
				+        stats2 = TermStatistics()
			
 
				+        stats2.record_usage("火球术", "Fireball", False)
			
 
				+
			
 
				+        stats1.merge(stats2)
			
 
				+
			
 
				+        assert len(stats1) == 2
			
 
				+        stat_dict = stats1.get_statistics()
			
 
				+        assert stat_dict["unique_terms"] == 2
			
 
				+
			
 
				+    def test_get_records(self):
			
 
				+        """Test getting all recorded usage records."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", False)
			
 
				+
			
 
				+        records = stats.get_records()
			
 
				+        assert len(records) == 2
			
 
				+        assert all(isinstance(r, TermUsageRecord) for r in records)
			
 
				+
			
 
				+    def test_generate_report(self):
			
 
				+        """Test generating a human-readable report."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", False)
			
 
				+
			
 
				+        report = stats.generate_report()
			
 
				+
			
 
				+        assert "Term Translation Statistics" in report
			
 
				+        assert "Total usages: 2" in report
			
 
				+        assert "林风" in report
			
 
				+        assert "火球术" in report
			
 
				+        assert "Failed terms:" in report
			
 
				+
			
 
				+    def test_overall_success_rate_calculation(self):
			
 
				+        """Test overall success rate calculation."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("林风", "Lin Feng", True)
			
 
				+        stats.record_usage("火球术", "Fireball", True)
			
 
				+        stats.record_usage("青云宗", "Qingyun Sect", False)
			
 
				+
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["overall_success_rate"] == 75.0
			
 
				+
			
 
				+    def test_empty_statistics(self):
			
 
				+        """Test statistics with no records."""
			
 
				+        stats = TermStatistics()
			
 
				+
			
 
				+        stat_dict = stats.get_statistics()
			
 
				+        assert stat_dict["total_usages"] == 0
			
 
				+        assert stat_dict["unique_terms"] == 0
			
 
				+        assert stat_dict["overall_success_rate"] == 100.0
			
 
				+
			
 
				+        report = stats.generate_report()
			
 
				+        assert "Total usages: 0" in report
			
 
				+
			
 
				+
			
 
				+class TestTermUsageRecord:
			
 
				+    """Test cases for TermUsageRecord dataclass."""
			
 
				+
			
 
				+    def test_create_record(self):
			
 
				+        """Test creating a usage record."""
			
 
				+        record = TermUsageRecord(
			
 
				+            term="林风",
			
 
				+            expected="Lin Feng",
			
 
				+            success=True,
			
 
				+            context="source_count=1"
			
 
				+        )
			
 
				+
			
 
				+        assert record.term == "林风"
			
 
				+        assert record.expected == "Lin Feng"
			
 
				+        assert record.success is True
			
 
				+        assert record.context == "source_count=1"
			
 
				+
			
 
				+
			
 
				+class TestTermResult:
			
 
				+    """Test cases for TermResult dataclass."""
			
 
				+
			
 
				+    def test_create_result(self):
			
 
				+        """Test creating a term result."""
			
 
				+        result = TermResult(
			
 
				+            source="林风",
			
 
				+            expected="Lin Feng",
			
 
				+            found=True,
			
 
				+            success=True,
			
 
				+            context="Valid translation"
			
 
				+        )
			
 
				+
			
 
				+        assert result.source == "林风"
			
 
				+        assert result.expected == "Lin Feng"
			
 
				+        assert result.found is True
			
 
				+        assert result.success is True
			
 
				+        assert result.context == "Valid translation"
			
 
				+
			
 
				+
			
 
				+class TestTermValidationResult:
			
 
				+    """Test cases for TermValidationResult dataclass."""
			
 
				+
			
 
				+    def test_create_validation_result(self):
			
 
				+        """Test creating a validation result."""
			
 
				+        term_results = {
			
 
				+            "林风": TermResult("林风", "Lin Feng", True, True),
			
 
				+            "火球术": TermResult("火球术", "Fireball", False, False)
			
 
				+        }
			
 
				+
			
 
				+        result = TermValidationResult(
			
 
				+            is_valid=False,
			
 
				+            term_results=term_results,
			
 
				+            success_rate=50.0,
			
 
				+            issues=["Fireball not found"]
			
 
				+        )
			
 
				+
			
 
				+        assert result.is_valid is False
			
 
				+        assert result.success_rate == 50.0
			
 
				+        assert len(result.issues) == 1
			
 
				+        assert "林风" in result.successful_terms
			
 
				+        assert "火球术" in result.failed_terms