Add translation cache for faster repeated translations (5000 entry LRU cache with hit rate tracking)

This commit is contained in:
Sepehr 2025-11-30 21:37:11 +01:00
parent d2b820c6f1
commit b65e683d32
2 changed files with 102 additions and 14 deletions

View File

@ -21,6 +21,7 @@ import time
from config import config from config import config
from translators import excel_translator, word_translator, pptx_translator from translators import excel_translator, word_translator, pptx_translator
from utils import file_handler, handle_translation_error, DocumentProcessingError from utils import file_handler, handle_translation_error, DocumentProcessingError
from services.translation_service import _translation_cache
# Import auth routes # Import auth routes
from routes.auth_routes import router as auth_router from routes.auth_routes import router as auth_router
@ -228,7 +229,8 @@ async def health_check():
"rate_limits": { "rate_limits": {
"requests_per_minute": rate_limit_config.requests_per_minute, "requests_per_minute": rate_limit_config.requests_per_minute,
"translations_per_minute": rate_limit_config.translations_per_minute, "translations_per_minute": rate_limit_config.translations_per_minute,
} },
"translation_cache": _translation_cache.stats()
} }
) )

View File

@ -1,7 +1,7 @@
""" """
Translation Service Abstraction Translation Service Abstraction
Provides a unified interface for different translation providers Provides a unified interface for different translation providers
Optimized for high performance with parallel processing Optimized for high performance with parallel processing and caching
""" """
from abc import ABC, abstractmethod from abc import ABC, abstractmethod
from typing import Optional, List, Dict, Tuple from typing import Optional, List, Dict, Tuple
@ -13,12 +13,77 @@ import threading
import asyncio import asyncio
from functools import lru_cache from functools import lru_cache
import time import time
import hashlib
from collections import OrderedDict
# Global thread pool for parallel translations # Global thread pool for parallel translations
_executor = concurrent.futures.ThreadPoolExecutor(max_workers=8) _executor = concurrent.futures.ThreadPoolExecutor(max_workers=8)
class TranslationCache:
"""Thread-safe LRU cache for translations to avoid redundant API calls"""
def __init__(self, maxsize: int = 5000):
self.cache: OrderedDict = OrderedDict()
self.maxsize = maxsize
self.lock = threading.RLock()
self.hits = 0
self.misses = 0
def _make_key(self, text: str, target_language: str, source_language: str, provider: str) -> str:
"""Create a unique cache key"""
content = f"{provider}:{source_language}:{target_language}:{text}"
return hashlib.md5(content.encode('utf-8')).hexdigest()
def get(self, text: str, target_language: str, source_language: str, provider: str) -> Optional[str]:
"""Get a cached translation if available"""
key = self._make_key(text, target_language, source_language, provider)
with self.lock:
if key in self.cache:
self.hits += 1
# Move to end (most recently used)
self.cache.move_to_end(key)
return self.cache[key]
self.misses += 1
return None
def set(self, text: str, target_language: str, source_language: str, provider: str, translation: str):
"""Cache a translation result"""
key = self._make_key(text, target_language, source_language, provider)
with self.lock:
if key in self.cache:
self.cache.move_to_end(key)
self.cache[key] = translation
# Remove oldest if exceeding maxsize
while len(self.cache) > self.maxsize:
self.cache.popitem(last=False)
def clear(self):
"""Clear the cache"""
with self.lock:
self.cache.clear()
self.hits = 0
self.misses = 0
def stats(self) -> Dict:
"""Get cache statistics"""
with self.lock:
total = self.hits + self.misses
hit_rate = (self.hits / total * 100) if total > 0 else 0
return {
"size": len(self.cache),
"maxsize": self.maxsize,
"hits": self.hits,
"misses": self.misses,
"hit_rate": f"{hit_rate:.1f}%"
}
# Module-level singleton cache shared by all translation providers in this
# process; its stats() output is surfaced by the health-check endpoint.
_translation_cache = TranslationCache(maxsize=5000)
class TranslationProvider(ABC): class TranslationProvider(ABC):
"""Abstract base class for translation providers""" """Abstract base class for translation providers"""
@ -63,10 +128,11 @@ class TranslationProvider(ABC):
class GoogleTranslationProvider(TranslationProvider): class GoogleTranslationProvider(TranslationProvider):
"""Google Translate implementation with batch support""" """Google Translate implementation with batch support and caching"""
def __init__(self): def __init__(self):
self._local = threading.local() self._local = threading.local()
self.provider_name = "google"
def _get_translator(self, source_language: str, target_language: str) -> GoogleTranslator: def _get_translator(self, source_language: str, target_language: str) -> GoogleTranslator:
"""Get or create a translator instance for the current thread""" """Get or create a translator instance for the current thread"""
@ -81,9 +147,17 @@ class GoogleTranslationProvider(TranslationProvider):
if not text or not text.strip(): if not text or not text.strip():
return text return text
# Check cache first
cached = _translation_cache.get(text, target_language, source_language, self.provider_name)
if cached is not None:
return cached
try: try:
translator = self._get_translator(source_language, target_language) translator = self._get_translator(source_language, target_language)
return translator.translate(text) result = translator.translate(text)
# Cache the result
_translation_cache.set(text, target_language, source_language, self.provider_name, result)
return result
except Exception as e: except Exception as e:
print(f"Translation error: {e}") print(f"Translation error: {e}")
return text return text
@ -91,7 +165,7 @@ class GoogleTranslationProvider(TranslationProvider):
def translate_batch(self, texts: List[str], target_language: str, source_language: str = 'auto', batch_size: int = 50) -> List[str]: def translate_batch(self, texts: List[str], target_language: str, source_language: str = 'auto', batch_size: int = 50) -> List[str]:
""" """
Translate multiple texts using batch processing for speed. Translate multiple texts using batch processing for speed.
Uses deep_translator's batch capability when possible. Uses caching to avoid redundant translations.
""" """
if not texts: if not texts:
return [] return []
@ -100,15 +174,24 @@ class GoogleTranslationProvider(TranslationProvider):
results = [''] * len(texts) results = [''] * len(texts)
non_empty_indices = [] non_empty_indices = []
non_empty_texts = [] non_empty_texts = []
texts_to_translate = []
indices_to_translate = []
for i, text in enumerate(texts): for i, text in enumerate(texts):
if text and text.strip(): if text and text.strip():
non_empty_indices.append(i) # Check cache first
non_empty_texts.append(text) cached = _translation_cache.get(text, target_language, source_language, self.provider_name)
if cached is not None:
results[i] = cached
else:
non_empty_indices.append(i)
non_empty_texts.append(text)
texts_to_translate.append(text)
indices_to_translate.append(i)
else: else:
results[i] = text if text else '' results[i] = text if text else ''
if not non_empty_texts: if not texts_to_translate:
return results return results
try: try:
@ -116,8 +199,8 @@ class GoogleTranslationProvider(TranslationProvider):
# Process in batches # Process in batches
translated_texts = [] translated_texts = []
for i in range(0, len(non_empty_texts), batch_size): for i in range(0, len(texts_to_translate), batch_size):
batch = non_empty_texts[i:i + batch_size] batch = texts_to_translate[i:i + batch_size]
try: try:
# Use translate_batch if available # Use translate_batch if available
if hasattr(translator, 'translate_batch'): if hasattr(translator, 'translate_batch'):
@ -145,16 +228,19 @@ class GoogleTranslationProvider(TranslationProvider):
except: except:
translated_texts.append(text) translated_texts.append(text)
# Map back to original positions # Map back to original positions and cache results
for idx, translated in zip(non_empty_indices, translated_texts): for idx, (original, translated) in zip(indices_to_translate, zip(texts_to_translate, translated_texts)):
results[idx] = translated if translated else texts[idx] result = translated if translated else texts[idx]
results[idx] = result
# Cache successful translations
_translation_cache.set(texts[idx], target_language, source_language, self.provider_name, result)
return results return results
except Exception as e: except Exception as e:
print(f"Batch translation failed: {e}") print(f"Batch translation failed: {e}")
# Fallback to individual translations # Fallback to individual translations
for idx, text in zip(non_empty_indices, non_empty_texts): for idx, text in zip(indices_to_translate, texts_to_translate):
try: try:
results[idx] = GoogleTranslator(source=source_language, target=target_language).translate(text) or text results[idx] = GoogleTranslator(source=source_language, target=target_language).translate(text) or text
except: except: