sbv Claude committed on
Commit
2d6c64f
·
1 Parent(s): b3590f6

Add real-time progress updates via Server-Sent Events

Browse files

Users now see step-by-step progress during document upload:
⏳ Uploading document...
📄 Converting document to markdown...
🌍 Detecting document language...
✓ Language: Portuguese
✂️ Creating smart chunks...
🤖 Loading Portuguese model (first time, ~30-60s)...
🧠 Generating embeddings...
💾 Storing in vector database...
✅ Ready! Ask your questions below.

Backend changes:
- Add SSE endpoint /api/progress/{session_id} for streaming progress
- Upload endpoint returns immediately and processes in background
- send_progress() helper sends updates through asyncio queue
- Progress messages added throughout document processing flow

Frontend changes:
- Connect to EventSource for real-time progress updates
- Display progress messages as they arrive
- Auto-close connection when processing complete

Benefits:
- Users know exactly what's happening (no more "is it stuck?")
- Clear indication when models are downloading
- Professional UX with real-time feedback

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>

Files changed (2) hide show
  1. backend/main.py +93 -21
  2. frontend/script.js +41 -16
backend/main.py CHANGED
@@ -1,12 +1,15 @@
1
  from fastapi import FastAPI, UploadFile, File, Form, HTTPException
2
  from fastapi.middleware.cors import CORSMiddleware
3
  from fastapi.staticfiles import StaticFiles
4
- from fastapi.responses import JSONResponse
5
  import tempfile
6
  import os
7
  from typing import Optional
8
  import uuid
9
  import warnings
 
 
 
10
 
11
  # Suppress ChromaDB telemetry warnings
12
  warnings.filterwarnings("ignore", message=".*capture.*takes 1 positional argument.*")
@@ -46,6 +49,9 @@ app.add_middleware(
46
  # In-memory storage for sessions
47
  sessions = {}
48
 
 
 
 
49
  # Language code mapping (Docling uses ISO 639-1, langdetect returns similar codes)
50
  SUPPORTED_LANGUAGES = {
51
  'en': 'English',
@@ -134,6 +140,15 @@ def translate_text(text: str, source_lang: str, target_lang: str) -> str:
134
  return text # Return original text if translation fails
135
 
136
 
 
 
 
 
 
 
 
 
 
137
  class DocumentProcessor:
138
  """Handles document processing and RAG functionality"""
139
 
@@ -160,6 +175,8 @@ class DocumentProcessor:
160
  def process_document(self, file_path: str, file_extension: str) -> dict:
161
  """Process document with Docling"""
162
  try:
 
 
163
  # Check PDF page limit
164
  if file_extension == "pdf":
165
  within_limit, num_pages = self.check_pdf_pages(file_path)
@@ -177,6 +194,8 @@ class DocumentProcessor:
177
  self.docling_document = result.document
178
  markdown_content = self.docling_document.export_to_markdown()
179
 
 
 
180
  # Extract document language from Docling metadata
181
  doc_lang = None
182
  if hasattr(result.document, 'lang') and result.document.lang:
@@ -198,6 +217,8 @@ class DocumentProcessor:
198
  print(f"Language from Docling: {doc_lang}")
199
 
200
  self.document_language = doc_lang
 
 
201
 
202
  # Estimate pages for non-PDF formats
203
  if file_extension != "pdf":
@@ -210,9 +231,11 @@ class DocumentProcessor:
210
 
211
  self.document_content = markdown_content
212
 
 
213
  # Chunk using HybridChunker with document structure
214
  chunks = self._chunk_with_hybrid_chunker()
215
 
 
216
  # Create embeddings and store in ChromaDB
217
  self._create_vector_store(chunks)
218
 
@@ -275,6 +298,8 @@ class DocumentProcessor:
275
 
276
  # Lazy-load model if not already loaded
277
  if self.document_language not in embedding_models:
 
 
278
  load_language_model(self.document_language)
279
 
280
  # Get the appropriate embedding model for document language
@@ -286,6 +311,7 @@ class DocumentProcessor:
286
  # Generate embeddings
287
  embeddings = embedding_model.encode(chunks).tolist()
288
 
 
289
  # Add to ChromaDB
290
  ids = [f"chunk_{i}" for i in range(len(chunks))]
291
  self.collection.add(
@@ -294,6 +320,8 @@ class DocumentProcessor:
294
  ids=ids
295
  )
296
 
 
 
297
  except Exception as e:
298
  raise HTTPException(status_code=500, detail=f"Error creating vector store: {str(e)}")
299
 
@@ -395,6 +423,41 @@ async def model_status():
395
  }
396
 
397
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
398
  @app.post("/upload")
399
  async def upload_document(
400
  file: UploadFile = File(...),
@@ -425,34 +488,43 @@ async def upload_document(
425
  # Create session
426
  session_id = str(uuid.uuid4())
427
 
 
 
 
428
  # Save uploaded file temporarily
429
  with tempfile.NamedTemporaryFile(delete=False, suffix=f".{file_extension}") as tmp_file:
430
  content = await file.read()
431
  tmp_file.write(content)
432
  tmp_file_path = tmp_file.name
433
 
434
- try:
435
- # Process document
436
- processor = DocumentProcessor(session_id)
437
- result = processor.process_document(tmp_file_path, file_extension)
438
-
439
- # Store session
440
- sessions[session_id] = {
441
- "processor": processor,
442
- "api_key": api_key,
443
- "filename": file.filename
444
- }
 
 
 
 
 
 
 
445
 
446
- return {
447
- **result,
448
- "session_id": session_id,
449
- "filename": file.filename
450
- }
451
 
452
- finally:
453
- # Clean up temp file
454
- if os.path.exists(tmp_file_path):
455
- os.unlink(tmp_file_path)
 
 
456
 
457
 
458
  @app.post("/ask")
 
1
  from fastapi import FastAPI, UploadFile, File, Form, HTTPException
2
  from fastapi.middleware.cors import CORSMiddleware
3
  from fastapi.staticfiles import StaticFiles
4
+ from fastapi.responses import JSONResponse, StreamingResponse
5
  import tempfile
6
  import os
7
  from typing import Optional
8
  import uuid
9
  import warnings
10
+ import asyncio
11
+ import json
12
+ from collections import defaultdict
13
 
14
  # Suppress ChromaDB telemetry warnings
15
  warnings.filterwarnings("ignore", message=".*capture.*takes 1 positional argument.*")
 
49
  # In-memory storage for sessions
50
  sessions = {}
51
 
52
+ # Progress tracking for real-time updates
53
+ progress_queues = defaultdict(asyncio.Queue)
54
+
55
  # Language code mapping (Docling uses ISO 639-1, langdetect returns similar codes)
56
  SUPPORTED_LANGUAGES = {
57
  'en': 'English',
 
140
  return text # Return original text if translation fails
141
 
142
 
143
def send_progress(session_id: str, message: str, step: str = "") -> None:
    """Queue a progress update for *session_id*'s SSE stream.

    The payload (``{"message", "step"}``) is pushed onto the session's
    queue in ``progress_queues`` (a defaultdict, so the queue is created
    on first use).  Best-effort: any failure is logged and never
    propagates to the caller.
    """
    payload = {"message": message, "step": step}
    try:
        progress_queues[session_id].put_nowait(payload)
    except Exception as exc:
        print(f"Error sending progress: {exc}")
150
+
151
+
152
  class DocumentProcessor:
153
  """Handles document processing and RAG functionality"""
154
 
 
175
  def process_document(self, file_path: str, file_extension: str) -> dict:
176
  """Process document with Docling"""
177
  try:
178
+ send_progress(self.session_id, "πŸ“„ Converting document to markdown...", "converting")
179
+
180
  # Check PDF page limit
181
  if file_extension == "pdf":
182
  within_limit, num_pages = self.check_pdf_pages(file_path)
 
194
  self.docling_document = result.document
195
  markdown_content = self.docling_document.export_to_markdown()
196
 
197
+ send_progress(self.session_id, "🌍 Detecting document language...", "detecting_language")
198
+
199
  # Extract document language from Docling metadata
200
  doc_lang = None
201
  if hasattr(result.document, 'lang') and result.document.lang:
 
217
  print(f"Language from Docling: {doc_lang}")
218
 
219
  self.document_language = doc_lang
220
+ lang_name = SUPPORTED_LANGUAGES.get(doc_lang, doc_lang.upper())
221
+ send_progress(self.session_id, f"βœ“ Language: {lang_name}", "language_detected")
222
 
223
  # Estimate pages for non-PDF formats
224
  if file_extension != "pdf":
 
231
 
232
  self.document_content = markdown_content
233
 
234
+ send_progress(self.session_id, "βœ‚οΈ Creating smart chunks...", "chunking")
235
  # Chunk using HybridChunker with document structure
236
  chunks = self._chunk_with_hybrid_chunker()
237
 
238
+ send_progress(self.session_id, "🧠 Generating embeddings...", "embedding")
239
  # Create embeddings and store in ChromaDB
240
  self._create_vector_store(chunks)
241
 
 
298
 
299
  # Lazy-load model if not already loaded
300
  if self.document_language not in embedding_models:
301
+ lang_name = SUPPORTED_LANGUAGES.get(self.document_language, self.document_language.upper())
302
+ send_progress(self.session_id, f"πŸ€– Loading {lang_name} model (first time, ~30-60s)...", "loading_model")
303
  load_language_model(self.document_language)
304
 
305
  # Get the appropriate embedding model for document language
 
311
  # Generate embeddings
312
  embeddings = embedding_model.encode(chunks).tolist()
313
 
314
+ send_progress(self.session_id, "πŸ’Ύ Storing in vector database...", "storing")
315
  # Add to ChromaDB
316
  ids = [f"chunk_{i}" for i in range(len(chunks))]
317
  self.collection.add(
 
320
  ids=ids
321
  )
322
 
323
+ send_progress(self.session_id, "βœ… Ready! Ask your questions below.", "complete")
324
+
325
  except Exception as e:
326
  raise HTTPException(status_code=500, detail=f"Error creating vector store: {str(e)}")
327
 
 
423
  }
424
 
425
 
426
@app.get("/api/progress/{session_id}")
async def progress_stream(session_id: str):
    """Server-Sent Events endpoint for real-time progress updates.

    Streams the JSON payloads queued by send_progress() for this session,
    one ``data:`` frame per update.  Emits an SSE comment as a keepalive
    when no update arrives within 120 s, and closes the stream on the
    terminal steps ('complete' or 'error').
    """
    async def event_generator():
        queue = progress_queues[session_id]
        try:
            while True:
                try:
                    # Wait for the next progress message; the timeout lets
                    # us keep the connection alive through proxies.
                    progress = await asyncio.wait_for(queue.get(), timeout=120.0)
                    # Send SSE-formatted message.
                    yield f"data: {json.dumps(progress)}\n\n"
                    # Stop on terminal steps.  'error' must also end the
                    # stream: the background task sends step="error" on
                    # failure and nothing afterwards, so breaking only on
                    # 'complete' would leave the client connected forever.
                    if progress.get("step") in ("complete", "error"):
                        break
                except asyncio.TimeoutError:
                    # SSE comment line — ignored by EventSource, but keeps
                    # the connection from being dropped as idle.
                    yield ": keepalive\n\n"
        except Exception as e:
            print(f"Progress stream error: {e}")
        finally:
            # Drop the queue so abandoned sessions don't leak memory.
            progress_queues.pop(session_id, None)

    return StreamingResponse(
        event_generator(),
        media_type="text/event-stream",
        headers={
            "Cache-Control": "no-cache",
            "Connection": "keep-alive",
        },
    )
459
+
460
+
461
  @app.post("/upload")
462
  async def upload_document(
463
  file: UploadFile = File(...),
 
488
  # Create session
489
  session_id = str(uuid.uuid4())
490
 
491
+ # Send initial progress message
492
+ send_progress(session_id, "⏳ Uploading document...", "uploading")
493
+
494
  # Save uploaded file temporarily
495
  with tempfile.NamedTemporaryFile(delete=False, suffix=f".{file_extension}") as tmp_file:
496
  content = await file.read()
497
  tmp_file.write(content)
498
  tmp_file_path = tmp_file.name
499
 
500
+ # Process document in background
501
+ async def process_in_background():
502
+ try:
503
+ processor = DocumentProcessor(session_id)
504
+ result = processor.process_document(tmp_file_path, file_extension)
505
+
506
+ # Store session
507
+ sessions[session_id] = {
508
+ "processor": processor,
509
+ "api_key": api_key,
510
+ "filename": file.filename
511
+ }
512
+ except Exception as e:
513
+ send_progress(session_id, f"❌ Error: {str(e)}", "error")
514
+ finally:
515
+ # Clean up temp file
516
+ if os.path.exists(tmp_file_path):
517
+ os.unlink(tmp_file_path)
518
 
519
+ # Start processing in background
520
+ asyncio.create_task(process_in_background())
 
 
 
521
 
522
+ # Return immediately with session_id so frontend can connect to SSE
523
+ return {
524
+ "session_id": session_id,
525
+ "filename": file.filename,
526
+ "status": "processing"
527
+ }
528
 
529
 
530
  @app.post("/ask")
frontend/script.js CHANGED
@@ -490,6 +490,8 @@ async function handleUpload() {
490
  return;
491
  }
492
 
 
 
493
  try {
494
  showLoading(getNestedTranslation('loading.processing'));
495
  hideStatus();
@@ -499,37 +501,60 @@ async function handleUpload() {
499
  formData.append('file', file);
500
  formData.append('api_key', apiKey);
501
 
502
- // Show model download message after 15 seconds
503
- const loadingTimeoutId = setTimeout(() => {
504
- showLoading(getNestedTranslation('loading.modelDownload'));
505
- }, 15000);
506
-
507
- // Upload (no timeout - CPU processing can take a while)
508
- const response = await fetch(`${API_BASE}/upload`, {
509
  method: 'POST',
510
  body: formData
511
  });
512
 
513
- clearTimeout(loadingTimeoutId);
514
-
515
  const data = await response.json();
516
 
517
  if (!response.ok) {
518
  throw new Error(data.detail || 'Upload failed');
519
  }
520
 
521
- // Success
522
- sessionId = data.session_id;
523
- documentNameEl.textContent = data.filename;
524
-
525
- // Show chat interface
526
- chatOverlay.classList.add('active');
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
527
 
528
  } catch (error) {
529
  console.error('Upload error:', error);
530
  showStatus(error.message, 'error');
531
- } finally {
532
  hideLoading();
 
533
  }
534
  }
535
 
 
490
  return;
491
  }
492
 
493
+ let eventSource = null;
494
+
495
  try {
496
  showLoading(getNestedTranslation('loading.processing'));
497
  hideStatus();
 
501
  formData.append('file', file);
502
  formData.append('api_key', apiKey);
503
 
504
+ // Start upload (returns immediately with session_id)
505
+ const uploadPromise = fetch(`${API_BASE}/upload`, {
 
 
 
 
 
506
  method: 'POST',
507
  body: formData
508
  });
509
 
510
+ // Get session_id from response to connect to progress stream
511
+ const response = await uploadPromise;
512
  const data = await response.json();
513
 
514
  if (!response.ok) {
515
  throw new Error(data.detail || 'Upload failed');
516
  }
517
 
518
+ // Connect to Server-Sent Events for progress updates
519
+ const tempSessionId = data.session_id;
520
+ eventSource = new EventSource(`${API_BASE}/api/progress/${tempSessionId}`);
521
+
522
+ eventSource.onmessage = (event) => {
523
+ try {
524
+ const progress = JSON.parse(event.data);
525
+ // Update loading message with progress
526
+ showLoading(progress.message);
527
+
528
+ // If complete, finalize
529
+ if (progress.step === 'complete') {
530
+ sessionId = tempSessionId;
531
+ documentNameEl.textContent = data.filename;
532
+ chatOverlay.classList.add('active');
533
+ hideLoading();
534
+ eventSource.close();
535
+ }
536
+ } catch (e) {
537
+ console.error('Progress parse error:', e);
538
+ }
539
+ };
540
+
541
+ eventSource.onerror = (error) => {
542
+ console.error('Progress stream error:', error);
543
+ eventSource.close();
544
+ // If error but response was OK, show success anyway
545
+ if (data.session_id) {
546
+ sessionId = data.session_id;
547
+ documentNameEl.textContent = data.filename;
548
+ chatOverlay.classList.add('active');
549
+ hideLoading();
550
+ }
551
+ };
552
 
553
  } catch (error) {
554
  console.error('Upload error:', error);
555
  showStatus(error.message, 'error');
 
556
  hideLoading();
557
+ if (eventSource) eventSource.close();
558
  }
559
  }
560