diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 37c06a7..98d9d05 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -25,6 +25,7 @@ jobs: run: | cd backend python -m pip install --upgrade pip + pip install --no-cache-dir torch==2.4.1+cpu torchaudio==2.4.1+cpu --index-url https://download.pytorch.org/whl/cpu pip install -r requirements.txt - name: Run tests diff --git a/.gitignore b/.gitignore index 993dad7..ed0cd39 100644 --- a/.gitignore +++ b/.gitignore @@ -162,11 +162,6 @@ docker-compose.override.yml # ------------------------- .DS_Store -backend/storage/* -!backend/storage/.gitkeep - -backend/models/* -!backend/models/.gitkeep - -backend/whisper/* -!backend/whisper/.gitkeep +# Faiss index and metadata files +backend/storage/faiss.index +backend/storage/metadata.json diff --git a/backend/app/embeddings/generate.py b/backend/app/embeddings/generate.py index fb5ee98..9fe5211 100644 --- a/backend/app/embeddings/generate.py +++ b/backend/app/embeddings/generate.py @@ -72,63 +72,61 @@ def _get_clip_model() -> torch.nn.Module: local_path = next((p for p in [env_path, repo_local, alt_repo_local] if p and os.path.exists(p)), None) if local_path: - # Check if it's a TorchScript model or state dict - # TorchScript models may have hardcoded CUDA references, so we need to be careful + # Check file size to detect TorchScript (they're usually small serialized format) + # TorchScript models may have hardcoded CUDA references, so we skip them by default + import stat try: - # Try loading as TorchScript first (always force CPU to avoid CUDA issues) - model = torch.jit.load(local_path, map_location="cpu") - # For TorchScript, we still need preprocess - _, preprocess, _ = open_clip.create_model_and_transforms("ViT-B-32", pretrained=False) - # Force model to CPU (TorchScript models may have hardcoded CUDA) - model = model.cpu() - model.eval() - except (Exception, RuntimeError) as e: - error_str = str(e) - # Check if error is CUDA-related - if so, skip this file entirely - is_cuda_error = "CUDA" in error_str or "cuda" in error_str.lower() + file_size = os.path.getsize(local_path) + is_likely_torchscript = file_size < 10 * 1024 * 1024 # Less than 10MB is likely TorchScript - if is_cuda_error: - # TorchScript file has hardcoded CUDA - skip it and create fresh model - print(f"Warning: TorchScript model file has hardcoded CUDA references. Skipping file and creating fresh CPU-compatible model.") + if is_likely_torchscript: + print(f"Warning: Detected TorchScript model file ({file_size} bytes). 
Skipping to avoid CUDA hardcoding.") model, preprocess, _ = open_clip.create_model_and_transforms( "ViT-B-32", pretrained="openai" ) model = model.to(device) else: - # Fall back to state dict loading or create fresh model - print(f"Loading model from state dict (TorchScript failed: {error_str[:100]})") + # Larger files might be state dicts try: - model, preprocess, _ = open_clip.create_model_and_transforms( - "ViT-B-32", pretrained=False - ) checkpoint = torch.load(local_path, map_location="cpu", weights_only=False) if isinstance(checkpoint, dict) and 'state_dict' in checkpoint: + # State dict checkpoint + model, preprocess, _ = open_clip.create_model_and_transforms( + "ViT-B-32", pretrained=False + ) model.load_state_dict(checkpoint['state_dict']) + model = model.to(device) + print(f"Loaded model from state dict checkpoint") elif isinstance(checkpoint, dict): + # Attempt to load dict as state + model, preprocess, _ = open_clip.create_model_and_transforms( + "ViT-B-32", pretrained=False + ) model.load_state_dict(checkpoint) + model = model.to(device) + print(f"Loaded model from state dict") else: - # If it's not a dict, it might be a TorchScript model object - # Check if it has TorchScript attributes - if hasattr(checkpoint, 'encode_image') and hasattr(checkpoint, 'graph'): - # It's a TorchScript model - skip it - print("Warning: Model file is TorchScript. Creating fresh model for CPU compatibility.") - model, preprocess, _ = open_clip.create_model_and_transforms( - "ViT-B-32", pretrained="openai" - ) - else: - model = checkpoint - _, preprocess, _ = open_clip.create_model_and_transforms("ViT-B-32", pretrained=False) - # Move to device (will be CPU) - model = model.to(device) - except Exception as e2: - # If state dict loading also fails, create a fresh model - print(f"Warning: Could not load model from file. Creating fresh model. Error: {str(e2)[:100]}") + # Unknown format - create fresh model + print(f"Unknown checkpoint format. Creating fresh model.") + model, preprocess, _ = open_clip.create_model_and_transforms( + "ViT-B-32", pretrained="openai" + ) + model = model.to(device) + except Exception as e: + print(f"Warning: Could not load checkpoint. Creating fresh model. Error: {str(e)[:100]}") model, preprocess, _ = open_clip.create_model_and_transforms( "ViT-B-32", pretrained="openai" ) model = model.to(device) + except Exception as e: + print(f"Warning: Error checking local model. Creating fresh model. Error: {str(e)[:100]}") + model, preprocess, _ = open_clip.create_model_and_transforms( + "ViT-B-32", pretrained="openai" + ) + model = model.to(device) else: # Download from openai (requires internet on first run) + print("No local CLIP model found. Downloading from OpenAI...") model, preprocess, _ = open_clip.create_model_and_transforms( "ViT-B-32", pretrained="openai" ) @@ -215,7 +213,11 @@ def embed_text(text: Union[str, List[str]]) -> np.ndarray: def embed_image(path: str) -> np.ndarray: - """Generate embeddings for image with strict CPU-only mode.""" + """Generate embeddings for image with strict CPU-only mode. + + Returns: + numpy array of shape (1, 512) containing normalized CLIP image embedding. 
+ """ global _clip_model, _clip_preprocess # Force CPU-only environment @@ -242,14 +244,22 @@ def embed_image(path: str) -> np.ndarray: try: # Encode image and normalize feats = model.encode_image(batch) + # Normalize: feats shape is (1, 512), normalize per-sample feats = feats / feats.norm(dim=-1, keepdim=True) - return feats.cpu().numpy().astype(np.float32) + result = feats.cpu().numpy().astype(np.float32) + + # Ensure shape is (1, 512) + if result.ndim == 1: + result = result.reshape(1, -1) + + assert result.shape == (1, 512), f"Expected shape (1, 512), got {result.shape}" + return result + except RuntimeError as e: error_msg = str(e) if "CUDA" in error_msg or "cuda" in error_msg.lower(): print("Warning: CUDA operation attempted. Reinitializing in CPU-only mode...") # Reset model to force CPU reinitialization - global _clip_model, _clip_preprocess _clip_model = None _clip_preprocess = None # Retry with fresh CPU model @@ -258,38 +268,15 @@ def embed_image(path: str) -> np.ndarray: batch = torch.stack([image]).cpu() feats = model.encode_image(batch) feats = feats / feats.norm(dim=-1, keepdim=True) - return feats.cpu().numpy().astype(np.float32) + result = feats.cpu().numpy().astype(np.float32) + if result.ndim == 1: + result = result.reshape(1, -1) + return result raise # Re-raise if it's not a CUDA error + except Exception as e: print(f"Error processing image {path}: {str(e)}") raise - - try: - with torch.no_grad(): - feats = model.encode_image(batch) - feats = feats / feats.norm(dim=-1, keepdim=True) - except RuntimeError as e: - if "CUDA" in str(e) or "cuda" in str(e).lower(): - # Model has CUDA hardcoded in TorchScript - need to recreate model - print(f"Warning: TorchScript model has hardcoded CUDA references. Recreating model for CPU compatibility.") - # Reset global model to force recreation - _clip_model = None - _clip_preprocess = None - - # Recreate model (will be CPU-compatible) - model, preprocess = get_clip() - device = torch.device("cpu") - model = model.cpu() - batch = batch.cpu() - - with torch.no_grad(): - feats = model.encode_image(batch) - feats = feats / feats.norm(dim=-1, keepdim=True) - else: - raise - - # Always return CPU numpy array - return feats.cpu().numpy().astype(np.float32) def embed_audio_segment(transcript: str) -> np.ndarray: diff --git a/backend/app/index_store.py b/backend/app/index_store.py index 976cdcb..6e1923e 100644 --- a/backend/app/index_store.py +++ b/backend/app/index_store.py @@ -27,7 +27,7 @@ def connect_db(): CREATE TABLE IF NOT EXISTS vectors ( id INTEGER PRIMARY KEY AUTOINCREMENT, vector_id INTEGER, - content TEXT, + page_content TEXT, file_name TEXT, file_type TEXT, page_number INTEGER, @@ -70,12 +70,12 @@ def add_embeddings_with_metadata(embeddings: np.ndarray, metadatas: List[dict]) for i, meta in enumerate(metadatas): cur.execute( """ - INSERT INTO vectors (vector_id, content, file_name, file_type, page_number, timestamp, filepath, width, height, bbox) + INSERT INTO vectors (vector_id, page_content, file_name, file_type, page_number, timestamp, filepath, width, height, bbox) VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?) 
""", ( start_id + i, - meta.get("content"), + meta.get("page_content"), meta.get("file_name"), meta.get("file_type"), meta.get("page_number"), @@ -107,7 +107,7 @@ def status() -> dict: def rebuild_from_db(dim: int) -> dict: conn = connect_db() cur = conn.cursor() - cur.execute("SELECT rowid, content FROM vectors ORDER BY rowid") + cur.execute("SELECT rowid, page_content FROM vectors ORDER BY rowid") rows = cur.fetchall() conn.close() if not rows: diff --git a/backend/app/ingestion/audio_transcriber.py b/backend/app/ingestion/audio_transcriber.py index 278d9e9..82ac459 100644 --- a/backend/app/ingestion/audio_transcriber.py +++ b/backend/app/ingestion/audio_transcriber.py @@ -1,108 +1,153 @@ -""" -Audio transcription using Whisper. +"""Audio transcription using local ASR (whisper/faster-whisper if available). + +This module tries to transcribe audio offline using locally installed Whisper +or faster-whisper backends. If neither is available, it will return an empty +transcript and the ingestion pipeline will surface an appropriate message. """ from __future__ import annotations import os -import subprocess -import tempfile from typing import List, Tuple from .base import Chunk, _split_text -def transcribe_audio_with_whisper_cpp(path: str) -> Tuple[str, List[Tuple[float, float, str]]]: - """ - Transcribe audio using Whisper model. - Returns (full_transcript, segments). - segments is a list of tuples (start_ms, end_ms, text). +def _format_timestamp(seconds: float) -> str: + """Format seconds as HH:MM:SS or MM:SS string.""" + try: + seconds = float(seconds) + except Exception: + return "" + hours = int(seconds // 3600) + minutes = int((seconds % 3600) // 60) + secs = int(seconds % 60) + if hours > 0: + return f"{hours:02d}:{minutes:02d}:{secs:02d}" + return f"{minutes:02d}:{secs:02d}" + + +def transcribe_audio_with_whisper(path: str) -> Tuple[str, List[Tuple[float, float, str]]]: + """Transcribe audio using available local Whisper implementation. + + Returns (full_transcript, segments) where segments is a list of + (start_seconds, end_seconds, text). """ + # Try openai/whisper first try: import whisper - import torch - import numpy as np - - # Force CPU mode for consistency - device = "cpu" - - # Load model with absolute path - model_path = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "..", "models", "whisper")) - model = whisper.load_model("base", download_root=model_path, device=device) - - # Transcribe audio - result = model.transcribe(path, language=None) - - # Extract transcript and segments + print(f"[Audio] Loading openai-whisper model 'base'...") + model = whisper.load_model("base", device="cpu") + print(f"[Audio] Transcribing {path}...") + result = model.transcribe(path) transcript = result.get("text", "").strip() segments = [] - - # Process segments if available for seg in result.get("segments", []): + start = seg.get("start", 0.0) + end = seg.get("end", 0.0) text = seg.get("text", "").strip() if text: - start = seg.get("start", 0) - end = seg.get("end", 0) - segments.append((start, end, text)) - + segments.append((float(start), float(end), text)) + print(f"[Audio] Transcription complete. 
Length: {len(transcript)} chars.") return transcript, segments + except ImportError: + print("[Audio] openai-whisper not installed.") + except Exception as e: + print(f"[Audio] openai-whisper failed: {e}") + + # Try faster-whisper if installed (it often works well offline) + try: + from faster_whisper import WhisperModel + print(f"[Audio] Loading faster-whisper model...") + model_size = "small" + model_dir = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "..", "models", "whisper")) + model = WhisperModel(model_dir, device="cpu", compute_type="int8_float16") + segments_iter, info = model.transcribe(path, beam_size=5) + transcript_parts = [] + segments = [] + for segment in segments_iter: + start = float(segment.start) + end = float(segment.end) + text = segment.text.strip() + if text: + transcript_parts.append(text) + segments.append((start, end, text)) + return " ".join(transcript_parts), segments + except ImportError: + print("[Audio] faster-whisper not installed.") except Exception as e: - print(f"Error transcribing audio: {str(e)}") - pass + print(f"[Audio] faster-whisper failed: {e}") + + # If no local ASR available, return empty results (ingestion will handle fallback) + print("[Audio] No ASR backend available or all failed.") return "", [] def transcribe_audio(path: str, file_name: str) -> List[Chunk]: - """Transcribe audio file and create chunks with timestamps.""" - transcript, segments = transcribe_audio_with_whisper_cpp(path) + """Transcribe audio file and return a list of Chunk objects with timestamps. + + Each chunk will have attributes: + - content: transcript text + - file_name, file_type='audio', filepath + - start_ts (float seconds), end_ts (float seconds) + - timestamp (formatted start time string) + """ + transcript, segments = transcribe_audio_with_whisper(path) chunks: List[Chunk] = [] - - if not transcript or transcript.strip() == "": - # If transcription failed, return empty list - return chunks - - # Split transcript into chunks - split_chunks = _split_text(transcript) - - # Map chunks to segments for timestamp assignment - segment_idx = 0 - char_pos = 0 - - for i, ch in enumerate(split_chunks): - # Find corresponding segment for this chunk - chunk_start = char_pos - chunk_end = char_pos + len(ch) - - # Find segment that contains this chunk - timestamp_str = None - for seg_start, seg_end, seg_text in segments: - seg_char_start = sum(len(seg[2]) + 1 for seg in segments[:segments.index((seg_start, seg_end, seg_text))]) - seg_char_end = seg_char_start + len(seg_text) - - if chunk_start >= seg_char_start and chunk_start < seg_char_end: - # Format timestamp as "HH:MM:SS" or "MM:SS" - if seg_start is not None and seg_end is not None: - start_sec = seg_start / 1000.0 - end_sec = seg_end / 1000.0 - hours = int(start_sec // 3600) - minutes = int((start_sec % 3600) // 60) - seconds = int(start_sec % 60) - if hours > 0: - timestamp_str = f"{hours:02d}:{minutes:02d}:{seconds:02d}" - else: - timestamp_str = f"{minutes:02d}:{seconds:02d}" - break - - c = Chunk( - content=ch, - file_name=file_name, - file_type="audio", + + if not segments: + # If ASR failed, create a single placeholder chunk to surface the file + placeholder = Chunk( + content="[Transcription unavailable: please install a local ASR model (whisper or faster-whisper)]", + file_name=file_name, + file_type="audio", filepath=path, - timestamp=timestamp_str # Store timestamp in Chunk + timestamp=None ) - # Also store segments for reference - setattr(c, "segments", segments) - chunks.append(c) - - char_pos 
= chunk_end - + setattr(placeholder, "start_ts", None) + setattr(placeholder, "end_ts", None) + chunks.append(placeholder) + return chunks + + # For each segment returned by ASR, split further if needed and assign timestamps + for seg_start, seg_end, seg_text in segments: + seg_text = (seg_text or "").strip() + if not seg_text: + continue + + # Split long segment text into subchunks while preserving approximate timestamps + subchunks = _split_text(seg_text, min_size=100, max_size=400) + if not subchunks: + subchunks = [seg_text] + + total_chars = sum(len(s) for s in subchunks) + if total_chars == 0: + continue + + # Distribute timestamp range proportionally across subchunks + seg_duration = max(0.0, float(seg_end) - float(seg_start)) + char_cursor = 0 + for sub in subchunks: + proportion = len(sub) / total_chars + start_offset = (char_cursor / total_chars) * seg_duration + end_offset = ((char_cursor + len(sub)) / total_chars) * seg_duration + start_ts = float(seg_start) + start_offset + end_ts = float(seg_start) + end_offset + + ts_str = _format_timestamp(start_ts) + + c = Chunk( + content=sub, + file_name=file_name, + file_type="audio", + filepath=path, + timestamp=ts_str + ) + setattr(c, "start_ts", start_ts) + setattr(c, "end_ts", end_ts) + setattr(c, "char_start", None) + setattr(c, "char_end", None) + chunks.append(c) + + char_cursor += len(sub) + return chunks diff --git a/backend/app/ingestion/image_processor.py b/backend/app/ingestion/image_processor.py index 1c38353..b08eab6 100644 --- a/backend/app/ingestion/image_processor.py +++ b/backend/app/ingestion/image_processor.py @@ -5,38 +5,77 @@ from __future__ import annotations import os +import logging from typing import List, Optional from PIL import Image from .base import Chunk from ..image_utils import get_image_size +logger = logging.getLogger(__name__) + def detect_text_in_image(path: str) -> str: - """Extract text from image using OCR (optional pytesseract).""" + """Extract text from image using OCR (optional pytesseract). + + Returns: + Extracted text string, or empty string if OCR is not available or fails. + """ try: import pytesseract + logger.debug(f"Attempting OCR on image: {path}") image = Image.open(path) text = pytesseract.image_to_string(image) - return text.strip() + extracted = text.strip() + if extracted: + logger.debug(f"Successfully extracted {len(extracted)} characters via OCR") + return extracted except ImportError: - # pytesseract not available, return empty + # pytesseract not available - use fallback description + logger.debug("pytesseract not available. Using filename-based description.") return "" - except Exception: + except Exception as e: + # Log but don't fail - continue processing without OCR + logger.warning(f"OCR extraction failed for {path}: {e}") return "" def image_to_embedding(path: str, file_name: str) -> List[Chunk]: - """Process image and create chunk for embedding.""" + """Process image and create chunk for embedding with rich content. + + The chunk content includes: + 1. Image filename (always) + 2. OCR text if available (extracted via Tesseract) + 3. A semantic description hint + + This ensures that both visual (via CLIP embedding) and textual (via OCR) + aspects of the image are indexed and retrievable. 
+ """ try: w, h = get_image_size(path) - except Exception: + except Exception as e: + logger.warning(f"Could not get image dimensions for {path}: {e}") w, h = None, None - # Try OCR if available + # Extract OCR text from image (if pytesseract available) ocr_text = detect_text_in_image(path) + # Build rich content description for the image chunk + content_parts = [f"Image: {file_name}"] + + # Add OCR text as primary content if available + if ocr_text: + content_parts.append(f"OCR Text: {ocr_text}") + else: + # Add dimensional hints for retrieval if no OCR + if w and h: + content_parts.append(f"Dimensions: {w}x{h} pixels") + + # Combine content - this will be embedded by CLIP (image embedding) + # and also used for text search in vector store + full_content = " | ".join(content_parts) + ch = Chunk( - content=f"Image: {file_name}" + (f" | OCR: {ocr_text}" if ocr_text else ""), + content=full_content, file_name=file_name, file_type="image", filepath=path, diff --git a/backend/app/llm/prompts.py b/backend/app/llm/prompts.py index 3e2157e..7d20554 100644 --- a/backend/app/llm/prompts.py +++ b/backend/app/llm/prompts.py @@ -26,7 +26,7 @@ def build_prompt(query: str, sources: List[Dict[str, Any]]) -> str: - """Build a comprehensive prompt with context sources.""" + """Build a comprehensive prompt with context sources, optimized for multimodal content.""" if not sources: return f"USER QUESTION: {query}\n\nAnswer: I don't have any relevant information to answer this question." @@ -35,20 +35,29 @@ def build_prompt(query: str, sources: List[Dict[str, Any]]) -> str: # Build source description source_desc = f"[{i}] " - # Add file information + # Add file information and modality indicator file_name = source.get('file_name', 'Unknown') file_type = source.get('file_type', 'unknown') - source_desc += f"{file_name} ({file_type})" + modality = source.get('modality', file_type) + + source_desc += f"{file_name}" + + # Add modality hint for better LLM context + if file_type == 'image': + source_desc += " (Screenshot/Image)" + elif file_type == 'pdf': + source_desc += " (PDF Document)" + elif file_type == 'audio': + source_desc += " (Audio)" # Add location information if file_type == 'pdf' and source.get('page_number'): source_desc += f" - Page {source['page_number']}" elif file_type == 'audio' and source.get('timestamp'): source_desc += f" - {source['timestamp']}" - elif file_type == 'image': - source_desc += " - Image" # Add content snippet + # For images, we want OCR text to be prominent content = source.get('content', '').strip() if content: # Truncate very long content @@ -56,6 +65,12 @@ def build_prompt(query: str, sources: List[Dict[str, Any]]) -> str: content = content[:500] + "..." source_desc += f": {content}" + # If no content but we have OCR text in metadata, show it + # (for backward compatibility, also check for ocr_text field) + ocr_text = source.get('ocr_text', '') + if ocr_text and not content: + source_desc += f": (OCR) {ocr_text}" + context_lines.append(source_desc) context_sources = "\n".join(context_lines) @@ -88,7 +103,7 @@ def build_simple_prompt(query: str, sources: List[Dict[str, Any]]) -> str: def build_multimodal_prompt(query: str, sources: List[Dict[str, Any]]) -> str: - """Build prompt optimized for multimodal content.""" + """Build prompt optimized for multimodal content with proper image handling.""" if not sources: return f"Question: {query}\nAnswer: I don't have any relevant information." 
@@ -107,31 +122,55 @@ def build_multimodal_prompt(query: str, sources: List[Dict[str, Any]]) -> str: text_sources.append(source) prompt_parts = [] + counter = 1 if text_sources: prompt_parts.append("TEXT SOURCES:") - for i, source in enumerate(text_sources, start=1): + for source in text_sources: content = source.get('content', '').strip() file_name = source.get('file_name', 'Unknown') - prompt_parts.append(f"[{i}] {file_name}: {content}") + if content: + if len(content) > 300: + content = content[:300] + "..." + prompt_parts.append(f"[{counter}] {file_name}: {content}") + counter += 1 if image_sources: - prompt_parts.append("\nIMAGE SOURCES:") - for i, source in enumerate(image_sources, start=len(text_sources) + 1): + prompt_parts.append("\nIMAGE SOURCES (Screenshots/Diagrams):") + for source in image_sources: + # For images, the content field should already contain OCR text (from image_processor.py) content = source.get('content', '').strip() file_name = source.get('file_name', 'Unknown') - prompt_parts.append(f"[{i}] {file_name}: {content}") + + # Fallback to ocr_text field if available and content is just the filename + ocr_text = source.get('ocr_text', '') + if not content or content.startswith('Image:'): + if ocr_text: + content = ocr_text + else: + content = "(Image - describe based on filename and any visible elements)" + + if len(content) > 300: + content = content[:300] + "..." + + # Make image source more distinct for the LLM + prompt_parts.append(f"[{counter}] {file_name} (IMAGE): {content}") + counter += 1 if audio_sources: - prompt_parts.append("\nAUDIO SOURCES:") - for i, source in enumerate(audio_sources, start=len(text_sources) + len(image_sources) + 1): + prompt_parts.append("\nAUDIO SOURCES (Transcripts):") + for source in audio_sources: content = source.get('content', '').strip() file_name = source.get('file_name', 'Unknown') timestamp = source.get('timestamp', '') - if timestamp: - prompt_parts.append(f"[{i}] {file_name} ({timestamp}): {content}") - else: - prompt_parts.append(f"[{i}] {file_name}: {content}") + if content: + if len(content) > 300: + content = content[:300] + "..." + if timestamp: + prompt_parts.append(f"[{counter}] {file_name} ({timestamp}): {content}") + else: + prompt_parts.append(f"[{counter}] {file_name}: {content}") + counter += 1 context = "\n".join(prompt_parts) @@ -141,4 +180,11 @@ def build_multimodal_prompt(query: str, sources: List[Dict[str, Any]]) -> str: Question: {query} -Answer based on the provided sources. Use [1], [2], etc. for citations. If information is missing, say so.""" +Important Instructions: +1. Use ONLY information from the sources [1] through [{counter-1}] +2. For image sources, describe what they show based on the text/OCR content provided +3. Cite sources inline using [1], [2], [3], etc. +4. If information is not in the sources, say "I don't have that information in the provided sources" +5. Be specific and accurate in your answers + +Answer:""" diff --git a/backend/app/main.py b/backend/app/main.py index 35c1289..585fe08 100644 --- a/backend/app/main.py +++ b/backend/app/main.py @@ -116,10 +116,28 @@ async def ingest(file: UploadFile = File(...)): ) if not chunks: - raise HTTPException( - status_code=422, - detail=f"No content could be extracted from {file.filename}. The file may be corrupted or in an unsupported format." - ) + # If the uploaded file is audio, don't fail the whole ingestion when + # transcription cannot be performed (missing ASR/model). 
Instead, + # create a placeholder audio chunk so the file is still indexed and + # can be surfaced to the user with a message about transcription. + audio_exts = ('.mp3', '.wav', '.m4a', '.flac', '.ogg') + if file.filename.lower().endswith(audio_exts): + from .ingestion.base import Chunk + placeholder = Chunk( + content="[Transcription unavailable: install a local ASR model (whisper or faster-whisper) to enable transcripts]", + file_name=file.filename, + file_type="audio", + filepath=dest_path, + timestamp=None + ) + setattr(placeholder, 'start_ts', None) + setattr(placeholder, 'end_ts', None) + chunks = [placeholder] + else: + raise HTTPException( + status_code=422, + detail=f"No content could be extracted from {file.filename}. The file may be corrupted or in an unsupported format." + ) # Generate embeddings and store using new vector store try: @@ -162,14 +180,16 @@ async def ingest(file: UploadFile = File(...)): 'file_name': chunk.file_name, 'file_type': chunk.file_type, 'page_number': chunk.page_number, - 'timestamp': chunk.timestamp, + 'timestamp': chunk.timestamp, + 'start_ts': getattr(chunk, 'start_ts', None), + 'end_ts': getattr(chunk, 'end_ts', None), 'filepath': chunk.filepath, 'width': getattr(chunk, 'width', None), 'height': getattr(chunk, 'height', None), 'bbox': getattr(chunk, 'bbox', None), 'char_start': getattr(chunk, 'char_start', None), 'char_end': getattr(chunk, 'char_end', None), - 'modality': chunk.file_type + 'modality': chunk.file_type } }) except Exception as e: @@ -193,6 +213,8 @@ async def ingest(file: UploadFile = File(...)): 'file_type': chunk.file_type, 'page_number': chunk.page_number, 'timestamp': chunk.timestamp, + 'start_ts': getattr(chunk, 'start_ts', None), + 'end_ts': getattr(chunk, 'end_ts', None), 'filepath': chunk.filepath, 'width': getattr(chunk, 'width', None), 'height': getattr(chunk, 'height', None), @@ -270,16 +292,34 @@ def query(payload: dict): file_type = r.get("modality", r.get("file_type", "text")) page_num = r.get("page_number") timestamp = r.get("timestamp") - + start_ts = r.get("start_ts") + end_ts = r.get("end_ts") + # Build URL efficiently url = None if file_name: base_path = f"/files/{file_name}" if file_type == "pdf" and page_num is not None: url = f"{base_path}#page={page_num}" - elif file_type == "audio" and timestamp: - # URL-safe timestamp encoding - url = f"{base_path}#t={timestamp.replace(':', '')}" + elif file_type == "audio": + # Prefer numeric start_ts if available, otherwise fall back to timestamp string + ts_str = None + if start_ts is not None: + # format seconds to HH:MM:SS + try: + s = int(start_ts) + h = s // 3600 + m = (s % 3600) // 60 + sec = s % 60 + ts_str = f"{h:02d}:{m:02d}:{sec:02d}" if h > 0 else f"{m:02d}:{sec:02d}" + except Exception: + ts_str = None + if not ts_str and timestamp: + ts_str = timestamp + if ts_str: + url = f"{base_path}#timestamp={ts_str}" + else: + url = base_path elif file_type == "image": url = base_path else: diff --git a/backend/app/rag.py b/backend/app/rag.py index 78b769e..713a45a 100644 --- a/backend/app/rag.py +++ b/backend/app/rag.py @@ -42,7 +42,7 @@ def similarity_search(query: str, k: int) -> List[Dict]: cur = conn.cursor() placeholders = ",".join(["?"] * len(ids)) cur.execute( - f"SELECT vector_id, content, file_name, file_type, page_number, timestamp, filepath FROM vectors WHERE vector_id IN ({placeholders})", + f"SELECT vector_id, page_content, file_name, file_type, page_number, timestamp, filepath FROM vectors WHERE vector_id IN ({placeholders})", ids, ) rows = cur.fetchall() 
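One operational note on the content to page_content rename: CREATE TABLE IF NOT EXISTS will not alter a vectors table created before this change, so databases from older installs still carry the legacy column and the updated SELECT statements would fail. A one-off migration along these lines should cover it; the database path below is an assumption, point it at whatever SQLite file connect_db() actually opens:

# Hypothetical migration: rename the legacy "content" column to "page_content".
import sqlite3

DB_PATH = "backend/storage/vectors.db"  # assumed location, adjust to the real store

conn = sqlite3.connect(DB_PATH)
cur = conn.cursor()
cols = [row[1] for row in cur.execute("PRAGMA table_info(vectors)")]
if "content" in cols and "page_content" not in cols:
    # RENAME COLUMN needs SQLite 3.25+; on older versions recreate the table instead.
    cur.execute("ALTER TABLE vectors RENAME COLUMN content TO page_content")
    conn.commit()
conn.close()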
@@ -56,7 +56,7 @@ def similarity_search(query: str, k: int) -> List[Dict]: results.append( { "vector_id": r[0], - "content": r[1], + "page_content": r[1], "file_name": r[2], "file_type": r[3], "page_number": r[4], @@ -77,7 +77,7 @@ def build_prompt(query: str, sources: List[Dict]) -> str: where += f" page {s['page_number']}" if s.get("file_type") == "audio" and s.get("timestamp"): where += f" {s['timestamp']}" - snippet = (s.get("content") or "").replace("\n", " ") + snippet = (s.get("page_content") or "").replace("\n", " ") lines.append(f"Source {marker} {where}: \"{snippet}\"") lines.append("\nAnswer the user query using only the information from sources [1..k]. Provide citations inline like [1], [2]. If the answer is unknown from sources, say you don't know.") lines.append(f"\nUser query: {query}\nAnswer:") @@ -97,7 +97,7 @@ def answer_query(cfg_path: str, query: str) -> dict: { "id": i, "file_name": s.get("file_name"), - "snippet": s.get("content"), + "snippet": s.get("page_content"), "page_number": s.get("page_number"), "timestamp": s.get("timestamp"), "score": s.get("score"), diff --git a/backend/app/vector_store/faiss_store.py b/backend/app/vector_store/faiss_store.py index d2549b3..4157b78 100644 --- a/backend/app/vector_store/faiss_store.py +++ b/backend/app/vector_store/faiss_store.py @@ -121,11 +121,13 @@ def upsert(self, items: List[Dict[str, Any]]) -> int: vector_id = start_id + i self.metadata[str(vector_id)] = { 'vector_id': vector_id, - 'content': metadata.get('content', ''), + 'page_content': metadata.get('page_content', ''), 'file_name': metadata.get('file_name', ''), 'file_type': metadata.get('file_type', ''), 'page_number': metadata.get('page_number'), 'timestamp': metadata.get('timestamp'), + 'start_ts': metadata.get('start_ts'), + 'end_ts': metadata.get('end_ts'), 'filepath': metadata.get('filepath'), 'width': metadata.get('width'), 'height': metadata.get('height'), @@ -217,9 +219,27 @@ def rebuild_from_metadata(self): # This would require re-computing embeddings from original content # For now, just reinitialize with current dimension self.index = faiss.IndexFlatIP(self.dimension) + + # Get all embeddings and IDs from metadata + embeddings = [] + ids = [] + for vector_id, meta in self.metadata.items(): + # Assuming 'page_content' holds the text for embedding + text_to_embed = meta.get('page_content', '') + if text_to_embed: + # Re-create embedding. This requires access to an embedding function. + # This is a placeholder for where you'd call your embedding function. 
+ # from ..embeddings import embed_text + # embedding = embed_text(text_to_embed) + # embeddings.append(embedding) + # ids.append(int(vector_id)) + pass # Placeholder for re-embedding logic + + # if embeddings: + # self.index.add_with_ids(np.array(embeddings), np.array(ids)) + self._persist_index() - # Global store instance for backward compatibility _store_instance: Optional[FAISSStore] = None diff --git a/backend/requirements.txt b/backend/requirements.txt index 367ea45..a24fbfb 100644 --- a/backend/requirements.txt +++ b/backend/requirements.txt @@ -8,9 +8,9 @@ sentence-transformers==3.0.1 PyMuPDF==1.24.10 python-docx==1.1.2 Pillow==10.4.0 -torch==2.4.1 +# torch==2.4.1 open-clip-torch==2.26.1 -torchaudio==2.4.1 +# torchaudio==2.4.1 rich==13.8.1 aiohttp==3.10.5 @@ -32,3 +32,7 @@ pytest==7.4.3 pytest-asyncio==0.21.1 + +# Audio Transcription +openai-whisper==20231117 +ffmpeg-python==0.2.0 diff --git a/backend/scripts/test_audio_pipeline.py b/backend/scripts/test_audio_pipeline.py new file mode 100644 index 0000000..dee0b73 --- /dev/null +++ b/backend/scripts/test_audio_pipeline.py @@ -0,0 +1,85 @@ +"""End-to-end test script for the audio ingestion pipeline. + +This script is intended to be runnable locally. It: + - Creates a short synthetic WAV file in storage + - Calls the ingestion/transcription pipeline directly + - Embeds transcript segments using the unified embed_text() + - Indexes embeddings in FAISS + - Performs a simple search to verify vectors are searchable + +The script is tolerant of missing ASR backends: if no local ASR is available, +the pipeline will insert a placeholder chunk and indexing will still succeed. +""" + +import os +import wave +import struct +import tempfile +import numpy as np + +from backend.app.ingestion.audio_transcriber import transcribe_audio +from backend.app.embeddings.generate import embed_text +from backend.app.vector_store.faiss_store import get_store, upsert, search + + +def generate_silent_wav(path: str, duration_sec: float = 1.0, rate: int = 16000): + n_samples = int(duration_sec * rate) + amplitude = 0 + with wave.open(path, 'w') as wf: + wf.setnchannels(1) + wf.setsampwidth(2) + wf.setframerate(rate) + frames = (struct.pack(' { - if (typeof window === "undefined") return false; - const saved = localStorage.getItem("theme-dark"); - return saved ? JSON.parse(saved) : false; - }); + const [isDarkMode, setIsDarkMode] = useState(true); + + // Static chat history for demo + const [chatHistory] = useState([ + { id: 1, title: "What is RAG?", date: "Today" }, + { id: 2, title: "Document analysis help", date: "Yesterday" }, + { id: 3, title: "Audio transcription query", date: "Nov 20" }, + ]); // Monitor online/offline status useEffect(() => { @@ -35,7 +30,7 @@ function App() { ...prev, { role: "system", - content: "βœ… Connection restored. You're back online!", + content: "Connection restored. You're back online!", }, ]); }; @@ -46,7 +41,8 @@ function App() { ...prev, { role: "system", - content: "πŸ“΄ You're offline. Don't worry, you can still query your uploaded documents!", + content: + "You're offline. 
Don't worry, you can still query your uploaded documents!", }, ]); }; @@ -60,19 +56,7 @@ function App() { }; }, []); - useEffect(() => { - document.documentElement.classList.toggle("dark", dark); - localStorage.setItem("theme-dark", JSON.stringify(dark)); - }, [dark]); - // Welcome message on first load - useEffect(() => { - if (messages.length === 0) { - setMessages([ - - ]); - } - }, []); const handleSend = async (text) => { setMessages((prev) => [...prev, { role: "user", content: text }]); @@ -88,7 +72,7 @@ function App() { if (!res.ok) throw new Error("Query failed"); const data = await res.json(); - + setMessages((prev) => [ ...prev, { @@ -110,176 +94,368 @@ function App() { { role: "assistant", content: isOnline - ? "❌ Sorry, I couldn't connect to the server. Please check if the backend is running." - : "πŸ“΄ You're offline. Make sure your documents are already indexed to query them.", + ? "Sorry, I couldn't connect to the server. Please check if the backend is running." + : "You're offline. Make sure your documents are already indexed to query them.", }, ]); } setIsTyping(false); }; - const doSearch = async (query) => { - if (!query || !query.trim()) { - setResults([]); - return; - } - try { - const res = await fetch("http://localhost:8000/search/similarity", { - method: "POST", - headers: { "Content-Type": "application/json" }, - body: JSON.stringify({ query, k: 8 }), - }); - const data = await res.json(); - setResults(data.results || []); - } catch (e) { - console.error("Search failed:", e); - } - }; - const handleUploadComplete = (data) => { setIndexedDocs((prev) => prev + 1); setMessages((prev) => [ ...prev, { role: "system", - content: `βœ… Successfully indexed: ${data.file || "document"}\nπŸ“Š Vectors indexed: ${data.vectors_indexed || 0}`, + content: `Successfully indexed: ${ + data.file || "document" + }\nVectors indexed: ${data.vectors_indexed || 0}`, }, ]); }; - return ( -
[App.jsx render block: the JSX markup in this hunk is not recoverable; only diff markers, comments, and text fragments survive. Removed layout (per surviving fragments): the offline banner ("Offline Mode Active - You can query already indexed documents"), duplicate mobile-navigation buttons ("Upload Documents", "Retrieved Context"), a left Library/Context panel (ChatGPT-style sidebar), a chat header ("Assistant", "Multimodal RAG - Online/Offline mode"), a sidebar toggle button, and the source modal. Added layout: a mobile navigation bar; a desktop sidebar with a static "Chat History" list (chat title and date), a "Database Stats" block showing the indexed-document count, and a user area; a main content area with a top navbar ("Local AI Assistant" plus an Online/Offline indicator) and the chat area; and a right-hand context sidebar rendered only when search results exist.]
-); + {/* Right Sidebar (Context) - Desktop only */} + {results.length > 0 && ( + + )} } -export default App; \ No newline at end of file +export default App; diff --git a/frontend/src/ChatUI.jsx b/frontend/src/ChatUI.jsx index 0b6f365..b7fab4b 100644 --- a/frontend/src/ChatUI.jsx +++ b/frontend/src/ChatUI.jsx @@ -1,10 +1,11 @@ import { useEffect, useRef, useState } from "react"; +import { Mic } from "lucide-react"; export default function ChatUI({ messages, onSend, isTyping = false }) { const [input, setInput] = useState(""); const scrollRef = useRef(null); - // Simplified submit handler for text-only input + // Submit handler const submit = (e) => { e.preventDefault(); if (!input.trim()) return; @@ -12,6 +13,7 @@ export default function ChatUI({ messages, onSend, isTyping = false }) { setInput(""); }; + // Auto-scroll to bottom on new messages useEffect(() => { if (scrollRef.current) { scrollRef.current.scrollTop = scrollRef.current.scrollHeight; @@ -20,63 +22,85 @@ export default function ChatUI({ messages, onSend, isTyping = false }) { const Message = ({ role, content }) => { const isUser = role === "user"; + const isSystem = role === "system"; + + if (isSystem) { + return ( +
[ChatUI.jsx render markup: the JSX in the remainder of this diff is not recoverable. Surviving fragments indicate: a dedicated system-message style; restyled user ("U") and assistant (icon) avatars on the message bubbles; a redesigned typing indicator; an empty-state panel ("How can I help you today?", "Chat with your documents"); removal of the old "AI"/"You" avatar rendering; and a restyled bottom input area, where the newly imported Mic icon suggests a microphone button alongside the text input.]
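Finally, since the removed doSearch helper in App.jsx was the only visible caller of POST /search/similarity, a backend-side smoke test is a handy stand-in when verifying the renamed fields end to end. A sketch, with the response field names assumed from rag.py's similarity_search:

# Illustrative smoke test against a locally running backend on port 8000.
# The route and {"query", "k"} payload mirror the removed frontend helper;
# the result field names are assumptions based on rag.py.
import requests

resp = requests.post(
    "http://localhost:8000/search/similarity",
    json={"query": "release date decision", "k": 8},
    timeout=30,
)
resp.raise_for_status()
for hit in resp.json().get("results", []):
    print(hit.get("file_name"), hit.get("page_number"), hit.get("timestamp"))
    print("  ", (hit.get("page_content") or "")[:80])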