Skip to content

Commit 1068517

Browse files
hydropixclaude
and committed
Sync from main + working changes
Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
1 parent 0d84b55 commit 1068517

File tree

13 files changed

+437
-97
lines changed

13 files changed

+437
-97
lines changed

src/api/translation_state.py

Lines changed: 22 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -4,18 +4,28 @@
44
import threading
55
import time
66
import copy
7+
import uuid
78
from datetime import datetime
89
from typing import Dict, Any, Optional
910
from src.persistence.checkpoint_manager import CheckpointManager
1011

1112

13+
def generate_server_session_id() -> str:
14+
"""Generate a unique session ID for this server instance."""
15+
return str(uuid.uuid4())
16+
17+
1218
class TranslationStateManager:
1319
"""Thread-safe manager for translation state"""
1420

15-
def __init__(self, checkpoint_manager: Optional[CheckpointManager] = None):
21+
def __init__(self, checkpoint_manager: Optional[CheckpointManager] = None, server_session_id: Optional[str] = None):
1622
self._translations: Dict[str, Dict[str, Any]] = {}
1723
self._lock = threading.RLock() # Use RLock to allow nested locking
18-
self.checkpoint_manager = checkpoint_manager or CheckpointManager()
24+
# Generate a unique session ID for this server instance
25+
self.server_session_id = server_session_id or generate_server_session_id()
26+
self.checkpoint_manager = checkpoint_manager or CheckpointManager(
27+
server_session_id=self.server_session_id
28+
)
1929

2030
def create_translation(self, translation_id: str, config: Dict[str, Any]) -> None:
2131
"""Create a new translation entry"""
@@ -124,13 +134,20 @@ def get_translation_summaries(self) -> list:
124134
with self._lock:
125135
summaries = []
126136
for tid, data in self._translations.items():
137+
config = data.get('config', {})
138+
stats = data.get('stats', {})
127139
summaries.append({
128140
"translation_id": tid,
129141
"status": data.get('status'),
130142
"progress": data.get('progress'),
131-
"start_time": data.get('stats', {}).get('start_time'),
132-
"output_filename": data.get('config', {}).get('output_filename'),
133-
"file_type": data.get('config', {}).get('file_type', 'txt')
143+
"start_time": stats.get('start_time'),
144+
"output_filename": config.get('output_filename'),
145+
"input_filename": config.get('input_filename'),
146+
"file_type": config.get('file_type', 'txt'),
147+
# Include stats for UI restoration
148+
"total_chunks": stats.get('total_chunks', 0),
149+
"completed_chunks": stats.get('completed_chunks', 0),
150+
"last_translation": data.get('last_translation')
134151
})
135152
return sorted(summaries, key=lambda x: x.get('start_time', 0), reverse=True)
136153

src/api/websocket.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -38,6 +38,14 @@ def emit_update(socketio, translation_id, data_to_emit, state_manager):
3838
if 'progress' not in data_to_emit and 'progress' in translation_data:
3939
data_to_emit['progress'] = translation_data['progress']
4040

41+
# Store last translation for UI restoration after browser refresh
42+
log_entry = data_to_emit.get('log_entry')
43+
if (log_entry and log_entry.get('type') == 'llm_response' and
44+
log_entry.get('data', {}).get('response')):
45+
state_manager.set_translation_field(
46+
translation_id, 'last_translation', log_entry['data']['response']
47+
)
48+
4149
socketio.emit('translation_update', data_to_emit, namespace='/')
4250
except Exception as e:
4351
print(f"WebSocket emission error for {translation_id}: {e}")

src/core/adapters/generic_translator.py

Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,7 @@ async def translate(
5757
llm_provider: str,
5858
progress_callback: Optional[Callable] = None,
5959
log_callback: Optional[Callable] = None,
60+
stats_callback: Optional[Callable] = None,
6061
check_interruption_callback: Optional[Callable] = None,
6162
bilingual_output: bool = False,
6263
**llm_kwargs
@@ -71,6 +72,7 @@ async def translate(
7172
llm_provider: LLM provider name (ollama, gemini, openai, openrouter)
7273
progress_callback: Optional callback for progress updates (receives percentage)
7374
log_callback: Optional callback for logging (receives type and message)
75+
stats_callback: Optional callback for statistics updates (receives dict with total_chunks, completed_chunks, failed_chunks)
7476
check_interruption_callback: Optional callback to check if translation should be interrupted
7577
bilingual_output: If True, output will contain both original and translated text
7678
**llm_kwargs: Additional LLM configuration (endpoint, api_key, etc.)
@@ -100,6 +102,14 @@ async def translate(
100102
if log_callback:
101103
log_callback("units_found", f"Found {total_units} translation units")
102104

105+
# Send initial stats with total_chunks
106+
if stats_callback:
107+
stats_callback({
108+
'total_chunks': total_units,
109+
'completed_chunks': 0,
110+
'failed_chunks': 0
111+
})
112+
103113
# 3. Check for checkpoint and resume
104114
resume_from = 0
105115
checkpoint_data = self.checkpoint_manager.load_checkpoint(self.translation_id)
@@ -109,6 +119,13 @@ async def translate(
109119
if log_callback:
110120
log_callback("checkpoint_resumed",
111121
f"Resuming from unit {resume_from}/{total_units}")
122+
# Update stats with resumed progress
123+
if stats_callback:
124+
stats_callback({
125+
'total_chunks': total_units,
126+
'completed_chunks': resume_from,
127+
'failed_chunks': 0
128+
})
112129
else:
113130
# 4. Create new translation job
114131
self.checkpoint_manager.start_job(
@@ -216,6 +233,14 @@ async def translate(
216233
completed_chunks=i + 1
217234
)
218235

236+
# Update stats
237+
if stats_callback:
238+
stats_callback({
239+
'total_chunks': total_units,
240+
'completed_chunks': i + 1,
241+
'failed_chunks': failed_count
242+
})
243+
219244
# Update context for next unit
220245
last_context = (
221246
translated_content[-200:]
@@ -246,6 +271,14 @@ async def translate(
246271
failed_chunks=1
247272
)
248273

274+
# Update stats with failure
275+
if stats_callback:
276+
stats_callback({
277+
'total_chunks': total_units,
278+
'completed_chunks': i,
279+
'failed_chunks': failed_count
280+
})
281+
249282
except Exception as e:
250283
if log_callback:
251284
log_callback("unit_error",
@@ -263,6 +296,14 @@ async def translate(
263296
failed_chunks=1
264297
)
265298

299+
# Update stats with failure
300+
if stats_callback:
301+
stats_callback({
302+
'total_chunks': total_units,
303+
'completed_chunks': i,
304+
'failed_chunks': failed_count
305+
})
306+
266307
# 7. Reconstruct output file
267308
if log_callback:
268309
log_callback("reconstruct_start", "Reconstructing output file")

src/core/adapters/translate_file.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -180,10 +180,6 @@ async def translate_file(
180180
'gemini_api_key': gemini_api_key,
181181
'openai_api_key': openai_api_key,
182182
'openrouter_api_key': openrouter_api_key,
183-
'progress_callback': progress_callback,
184-
'log_callback': log_callback,
185-
'stats_callback': stats_callback,
186-
'check_interruption_callback': check_interruption_callback,
187183
'prompt_options': prompt_options,
188184
}
189185

@@ -193,6 +189,10 @@ async def translate_file(
193189
target_language=target_language,
194190
model_name=model_name,
195191
llm_provider=llm_provider,
192+
progress_callback=progress_callback,
193+
log_callback=log_callback,
194+
stats_callback=stats_callback,
195+
check_interruption_callback=check_interruption_callback,
196196
bilingual_output=bilingual_output,
197197
**llm_config
198198
)

src/persistence/checkpoint_manager.py

Lines changed: 147 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,16 +15,18 @@ class CheckpointManager:
1515
and file storage for uploaded files.
1616
"""
1717

18-
def __init__(self, db_path: str = "data/jobs.db"):
18+
def __init__(self, db_path: str = "data/jobs.db", server_session_id: Optional[str] = None):
1919
"""
2020
Initialize checkpoint manager.
2121
2222
Args:
2323
db_path: Path to SQLite database
24+
server_session_id: Unique identifier for the current server session
2425
"""
2526
self.db = Database(db_path)
2627
self.uploads_dir = Path("data/uploads")
2728
self.uploads_dir.mkdir(parents=True, exist_ok=True)
29+
self.server_session_id = server_session_id
2830

2931
def start_job(
3032
self,
@@ -49,8 +51,10 @@ def start_job(
4951
if input_file_path:
5052
self._preserve_input_file(translation_id, input_file_path, config)
5153

52-
# Create job in database with updated config
53-
success = self.db.create_job(translation_id, file_type, config)
54+
# Create job in database with updated config and server session ID
55+
success = self.db.create_job(
56+
translation_id, file_type, config, self.server_session_id
57+
)
5458

5559
return success
5660

@@ -263,6 +267,146 @@ def get_resumable_jobs(self) -> List[Dict[str, Any]]:
263267

264268
return jobs
265269

270+
def reset_running_jobs_on_startup(self) -> int:
271+
"""
272+
Reset jobs with 'running' status from previous server sessions to 'interrupted'.
273+
274+
Only resets jobs that have a different server_session_id, preserving
275+
jobs that are actually running in the current session. This prevents
276+
browser refreshes from interrupting active translations.
277+
278+
This should be called on server startup to handle jobs that were
279+
interrupted by a server crash or restart. These jobs will then
280+
appear in the resumable jobs list.
281+
282+
Returns:
283+
Number of jobs reset
284+
"""
285+
if not self.server_session_id:
286+
# Fallback: if no session ID, don't reset anything to be safe
287+
return 0
288+
return self.db.reset_running_jobs(self.server_session_id)
289+
290+
def cleanup_old_jobs(self, max_age_days: int = 30) -> Tuple[int, int]:
291+
"""
292+
Clean up old jobs and their associated files.
293+
294+
This removes jobs older than max_age_days and cleans up their
295+
upload directories to prevent database and disk bloat.
296+
297+
Args:
298+
max_age_days: Maximum age in days for jobs to keep (default 30)
299+
300+
Returns:
301+
Tuple of (jobs_deleted, files_cleaned)
302+
"""
303+
# Get list of old job IDs before deletion (for file cleanup)
304+
old_jobs = []
305+
try:
306+
from datetime import datetime, timedelta
307+
cutoff = datetime.now() - timedelta(days=max_age_days)
308+
309+
# Get jobs that will be deleted
310+
all_jobs = self.db.get_resumable_jobs(max_age_days=9999) # Get all
311+
for job in all_jobs:
312+
created_str = job.get('created_at', '')
313+
if created_str:
314+
try:
315+
created = datetime.fromisoformat(created_str.replace('Z', '+00:00'))
316+
if created.replace(tzinfo=None) < cutoff:
317+
old_jobs.append(job['translation_id'])
318+
except (ValueError, TypeError):
319+
pass
320+
except Exception as e:
321+
print(f"Warning: Error getting old job list: {e}")
322+
323+
# Delete from database
324+
jobs_deleted = self.db.cleanup_old_jobs(max_age_days)
325+
326+
# Clean up upload directories for deleted jobs
327+
files_cleaned = 0
328+
for job_id in old_jobs:
329+
job_upload_dir = self.uploads_dir / job_id
330+
if job_upload_dir.exists():
331+
try:
332+
shutil.rmtree(job_upload_dir)
333+
files_cleaned += 1
334+
except Exception as e:
335+
print(f"Warning: Could not delete upload directory for {job_id}: {e}")
336+
337+
return jobs_deleted, files_cleaned
338+
339+
def cleanup_orphan_uploads(self) -> int:
340+
"""
341+
Clean up upload files/directories that don't have corresponding jobs in the database.
342+
343+
These are "orphan" items left behind from previous incomplete cleanups.
344+
Handles:
345+
- trans_xxx folders (job ID folders)
346+
- hash_filename files (legacy upload files)
347+
348+
Returns:
349+
Number of orphan items deleted
350+
"""
351+
orphans_deleted = 0
352+
353+
if not self.uploads_dir.exists():
354+
return 0
355+
356+
# Get all job IDs and preserved file paths from database
357+
try:
358+
import sqlite3
359+
import json
360+
conn = sqlite3.connect(self.db.db_path)
361+
conn.row_factory = sqlite3.Row
362+
cursor = conn.cursor()
363+
cursor.execute("SELECT translation_id, config FROM translation_jobs")
364+
db_job_ids = set()
365+
preserved_files = set() # Full file paths that are referenced
366+
for row in cursor.fetchall():
367+
db_job_ids.add(row['translation_id'])
368+
config = json.loads(row['config'])
369+
preserved_path = config.get('preserved_input_path', '')
370+
if preserved_path:
371+
# Store the filename to check against orphan files
372+
preserved_files.add(Path(preserved_path).name)
373+
conn.close()
374+
except Exception as e:
375+
print(f"Warning: Error getting job IDs: {e}")
376+
return 0
377+
378+
# Check each item in uploads directory
379+
for item in self.uploads_dir.iterdir():
380+
item_name = item.name
381+
382+
# Skip test folders
383+
if item_name.startswith('test_'):
384+
continue
385+
386+
is_orphan = True
387+
388+
if item.is_dir():
389+
# It's a folder - check if it's a job ID folder
390+
if item_name.startswith('trans_'):
391+
if item_name in db_job_ids:
392+
is_orphan = False
393+
else:
394+
# It's a file - check if it's referenced by any job
395+
if item_name in preserved_files:
396+
is_orphan = False
397+
398+
if is_orphan:
399+
try:
400+
if item.is_dir():
401+
shutil.rmtree(item)
402+
else:
403+
item.unlink()
404+
orphans_deleted += 1
405+
except Exception as e:
406+
print(f"Warning: Could not delete orphan {item_name}: {e}")
407+
408+
return orphans_deleted
409+
266410
def mark_paused(self, translation_id: str) -> bool:
267411
"""
268412
Mark a job as paused (user-initiated stop).

0 commit comments

Comments (0)