diff --git a/backends/advanced/.env.template b/backends/advanced/.env.template index 9c11af67..752f140c 100644 --- a/backends/advanced/.env.template +++ b/backends/advanced/.env.template @@ -165,6 +165,13 @@ DEBUG_DIR=./data/debug_dir # HF_TOKEN= # SPEAKER_SERVICE_URL=http://speaker-recognition:8001 +# Speaker recognition chunking configuration (for large files) +# Files longer than SPEAKER_CHUNK_THRESHOLD will be split into smaller segments +# for processing to avoid memory issues +SPEAKER_CHUNK_THRESHOLD=1500 # 25 minutes - chunk files larger than this (seconds) +SPEAKER_CHUNK_SIZE=900 # 15 minutes - size of each chunk (seconds) +SPEAKER_CHUNK_OVERLAP=30 # 30 seconds - overlap between chunks for continuity + # Audio processing settings # NEW_CONVERSATION_TIMEOUT_MINUTES=1.5 # AUDIO_CROPPING_ENABLED=true diff --git a/backends/advanced/Docs/memories.md b/backends/advanced/Docs/memories.md index cae98383..08ae393e 100644 --- a/backends/advanced/Docs/memories.md +++ b/backends/advanced/Docs/memories.md @@ -98,7 +98,7 @@ MEM0_CONFIG = { "vector_store": { "provider": "qdrant", "config": { - "collection_name": "omi_memories", + "collection_name": "chronicle_memories", "embedding_model_dims": 768, "host": QDRANT_BASE_URL, "port": 6333, @@ -499,7 +499,7 @@ This will: 3. **Search Not Working** - Ensure embedding model is available in Ollama - Check vector dimensions match between embedder and Qdrant - - Verify collection has vectors: `curl http://localhost:6333/collections/omi_memories` + - Verify collection has vectors: `curl http://localhost:6333/collections/chronicle_memories` ### Required Ollama Models diff --git a/backends/advanced/docker-compose-test.yml b/backends/advanced/docker-compose-test.yml index 25e7da88..43a7f3b7 100644 --- a/backends/advanced/docker-compose-test.yml +++ b/backends/advanced/docker-compose-test.yml @@ -16,7 +16,8 @@ services: - ./data/test_audio_chunks:/app/audio_chunks - ./data/test_debug_dir:/app/debug # Fixed: mount to /app/debug for plugin database - ./data/test_data:/app/data - - ${CONFIG_FILE:-../../config/config.yml}:/app/config.yml # Mount config.yml for model registry and memory settings (writable for admin config updates) + - ../../config:/app/config # Mount config directory with defaults.yml + - ${CONFIG_FILE:-../../config/config.yml}:/app/config.yml # Override main config (for test-specific configs) - ${PLUGINS_CONFIG:-../../tests/config/plugins.test.yml}:/app/plugins.yml # Mount test plugins config environment: # Override with test-specific settings @@ -168,7 +169,8 @@ services: - ./data/test_audio_chunks:/app/audio_chunks - ./data/test_debug_dir:/app/debug # Fixed: mount to /app/debug for plugin database - ./data/test_data:/app/data - - ${CONFIG_FILE:-../../config/config.yml}:/app/config.yml # Mount config.yml for model registry and memory settings (writable for admin config updates) + - ../../config:/app/config # Mount config directory with defaults.yml + - ${CONFIG_FILE:-../../config/config.yml}:/app/config.yml # Override main config (for test-specific configs) - ${PLUGINS_CONFIG:-../../tests/config/plugins.test.yml}:/app/plugins.yml # Mount test plugins config environment: # Same environment as backend diff --git a/backends/advanced/docker-compose.yml b/backends/advanced/docker-compose.yml index ceaaf6a8..ed9e8356 100644 --- a/backends/advanced/docker-compose.yml +++ b/backends/advanced/docker-compose.yml @@ -39,8 +39,7 @@ services: - ./data/audio_chunks:/app/audio_chunks - ./data/debug_dir:/app/debug_dir - ./data:/app/data - - 
../../config/config.yml:/app/config.yml # Main config file - - ../../config/plugins.yml:/app/plugins.yml # Plugin configuration + - ../../config:/app/config # Mount entire config directory (includes config.yml, defaults.yml, plugins.yml) environment: - DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY} - PARAKEET_ASR_URL=${PARAKEET_ASR_URL} @@ -94,8 +93,7 @@ services: - ./worker_orchestrator.py:/app/worker_orchestrator.py - ./data/audio_chunks:/app/audio_chunks - ./data:/app/data - - ../../config/config.yml:/app/config.yml - - ../../config/plugins.yml:/app/plugins.yml + - ../../config:/app/config # Mount entire config directory (includes config.yml, defaults.yml, plugins.yml) environment: - DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY} - PARAKEET_ASR_URL=${PARAKEET_ASR_URL} diff --git a/backends/advanced/src/advanced_omi_backend/app_factory.py b/backends/advanced/src/advanced_omi_backend/app_factory.py index b8bc3e80..cf44ba34 100644 --- a/backends/advanced/src/advanced_omi_backend/app_factory.py +++ b/backends/advanced/src/advanced_omi_backend/app_factory.py @@ -56,10 +56,11 @@ async def lifespan(app: FastAPI): from advanced_omi_backend.models.conversation import Conversation from advanced_omi_backend.models.audio_chunk import AudioChunkDocument from advanced_omi_backend.models.user import User + from advanced_omi_backend.models.waveform import WaveformData await init_beanie( database=config.db, - document_models=[User, Conversation, AudioChunkDocument], + document_models=[User, Conversation, AudioChunkDocument, WaveformData], ) application_logger.info("Beanie initialized for all document models") except Exception as e: diff --git a/backends/advanced/src/advanced_omi_backend/config.py b/backends/advanced/src/advanced_omi_backend/config.py index f335b8be..543baeeb 100644 --- a/backends/advanced/src/advanced_omi_backend/config.py +++ b/backends/advanced/src/advanced_omi_backend/config.py @@ -9,6 +9,7 @@ import logging import os import shutil +import yaml from dataclasses import dataclass, asdict from pathlib import Path from typing import Optional @@ -60,17 +61,149 @@ def get_diarization_config_path(): data_path = Path("/app/data/diarization_config.json") if data_path.parent.exists(): return data_path - + # 2. App root directory app_path = Path("/app/diarization_config.json") if app_path.parent.exists(): return app_path - + # 3. Local development path local_path = Path("diarization_config.json") return local_path +# ============================================================================ +# Configuration Merging System (for defaults.yml + config.yml) +# ============================================================================ + +def get_config_dir() -> Path: + """ + Get config directory path. Single source of truth for config location. + Matches root config_manager.py logic. + + Returns: + Path to config directory + """ + config_dir = os.getenv("CONFIG_DIR", "/app/config") + return Path(config_dir) + + +def get_config_yml_path() -> Path: + """Get path to config.yml file.""" + return get_config_dir() / "config.yml" + + +def get_defaults_yml_path() -> Path: + """Get path to defaults.yml file.""" + return get_config_dir() / "defaults.yml" + + +def get_defaults_config_path(): + """ + Get the path to the defaults config file. + + DEPRECATED: Use get_defaults_yml_path() instead. + Kept for backward compatibility. 
+ """ + defaults_path = get_defaults_yml_path() + return defaults_path if defaults_path.exists() else None + + +def merge_configs(defaults: dict, overrides: dict) -> dict: + """ + Deep merge two configuration dictionaries. + + Override values take precedence over defaults. + Lists are replaced (not merged). + + Args: + defaults: Default configuration values + overrides: User-provided overrides + + Returns: + Merged configuration dictionary + """ + result = defaults.copy() + + for key, value in overrides.items(): + if key in result and isinstance(result[key], dict) and isinstance(value, dict): + # Recursively merge dictionaries + result[key] = merge_configs(result[key], value) + else: + # Override (lists, scalars, new keys) + result[key] = value + + return result + + +# Global cache for merged config +_config_cache: Optional[dict] = None + + +def get_config(force_reload: bool = False) -> dict: + """ + Get merged configuration from defaults.yml + config.yml. + + Priority order: config.yml > environment variables > defaults.yml + + Args: + force_reload: If True, reload from disk even if cached + + Returns: + Merged configuration dictionary with all settings + """ + global _config_cache + + if _config_cache is not None and not force_reload: + return _config_cache + + # Load defaults + defaults_path = get_defaults_yml_path() + defaults = {} + if defaults_path.exists(): + try: + with open(defaults_path, 'r') as f: + defaults = yaml.safe_load(f) or {} + logger.info(f"Loaded defaults from {defaults_path}") + except Exception as e: + logger.warning(f"Could not load defaults from {defaults_path}: {e}") + + # Load user config + config_path = get_config_yml_path() + user_config = {} + if config_path.exists(): + try: + with open(config_path, 'r') as f: + user_config = yaml.safe_load(f) or {} + logger.info(f"Loaded config from {config_path}") + except Exception as e: + logger.error(f"Error loading config from {config_path}: {e}") + + # Merge configurations + merged = merge_configs(defaults, user_config) + + # Resolve environment variables (lazy import to avoid circular dependency) + try: + from advanced_omi_backend.model_registry import _deep_resolve_env + merged = _deep_resolve_env(merged) + except ImportError: + # If model_registry not available, skip env resolution + # (will be resolved when model_registry loads the config) + logger.warning("Could not import _deep_resolve_env, environment variables may not be resolved") + + # Cache result + _config_cache = merged + + return merged + + +def reload_config(): + """Reload configuration from disk (invalidate cache).""" + global _config_cache + _config_cache = None + return get_config(force_reload=True) + + def load_diarization_settings_from_file(): """Load diarization settings from file or create from template.""" global _diarization_settings diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py index c0640841..3a2a8af8 100644 --- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py +++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py @@ -144,11 +144,30 @@ async def upload_and_process_audio_files( f"๐Ÿ“ฆ Converted uploaded file to {num_chunks} MongoDB chunks " f"(conversation {conversation_id[:12]})" ) + except ValueError as val_error: + # Handle validation errors (e.g., file too long) + audio_logger.error(f"Audio validation failed: {val_error}") + processed_files.append({ + "filename": 
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index c0640841..3a2a8af8 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -144,11 +144,30 @@ async def upload_and_process_audio_files(
                 f"📦 Converted uploaded file to {num_chunks} MongoDB chunks "
                 f"(conversation {conversation_id[:12]})"
             )
+        except ValueError as val_error:
+            # Handle validation errors (e.g., file too long)
+            audio_logger.error(f"Audio validation failed: {val_error}")
+            processed_files.append({
+                "filename": file.filename,
+                "status": "error",
+                "error": str(val_error),
+            })
+            # Delete the conversation since it won't have audio chunks
+            await conversation.delete()
+            continue
         except Exception as chunk_error:
             audio_logger.error(
                 f"Failed to convert uploaded file to chunks: {chunk_error}",
                 exc_info=True
             )
+            processed_files.append({
+                "filename": file.filename,
+                "status": "error",
+                "error": f"Audio conversion failed: {str(chunk_error)}",
+            })
+            # Delete the conversation since it won't have audio chunks
+            await conversation.delete()
+            continue
 
         # Enqueue batch transcription job first (file uploads need transcription)
         from advanced_omi_backend.controllers.queue_controller import (
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
index b6268c64..de7e046e 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
@@ -130,18 +130,26 @@ async def get_conversation(conversation_id: str, user: User):
         return JSONResponse(status_code=500, content={"error": "Error fetching conversation"})
 
 
-async def get_conversations(user: User):
+async def get_conversations(user: User, include_deleted: bool = False):
     """Get conversations with speech only (speech-driven architecture)."""
     try:
         # Build query based on user permissions using Beanie
         if not user.is_superuser:
             # Regular users can only see their own conversations
-            user_conversations = await Conversation.find(
-                Conversation.user_id == str(user.user_id)
-            ).sort(-Conversation.created_at).to_list()
+            # Filter by deleted status
+            query = Conversation.user_id == str(user.user_id)
+            if not include_deleted:
+                query = query & (Conversation.deleted == False)
+            user_conversations = await Conversation.find(query).sort(-Conversation.created_at).to_list()
         else:
             # Admins see all conversations
-            user_conversations = await Conversation.find_all().sort(-Conversation.created_at).to_list()
+            # Filter by deleted status
+            if not include_deleted:
+                user_conversations = await Conversation.find(
+                    Conversation.deleted == False
+                ).sort(-Conversation.created_at).to_list()
+            else:
+                user_conversations = await Conversation.find_all().sort(-Conversation.created_at).to_list()
 
         # Build response with explicit curated fields - minimal for list view
         conversations = []
diff --git a/backends/advanced/src/advanced_omi_backend/model_registry.py b/backends/advanced/src/advanced_omi_backend/model_registry.py
index 18f464ae..d0a46ab6 100644
--- a/backends/advanced/src/advanced_omi_backend/model_registry.py
+++ b/backends/advanced/src/advanced_omi_backend/model_registry.py
@@ -17,6 +17,9 @@ import logging
 
 from pydantic import BaseModel, Field, field_validator, model_validator, ConfigDict, ValidationError
 
+# Import config merging for defaults.yml + config.yml integration
+from advanced_omi_backend.config import get_config
+
 
 def _resolve_env(value: Any) -> Any:
     """Resolve ``${VAR:-default}`` patterns inside a single value.
@@ -250,54 +253,31 @@ def list_model_types(self) -> List[str]:
 
 
 def _find_config_path() -> Path:
-    """Find config.yml in expected locations.
-
-    Search order:
-    1. CONFIG_FILE environment variable
-    2. Current working directory
-    3. /app/config.yml (Docker container)
-    4. 
Walk up from module directory - - Returns: - Path to config.yml (may not exist) """ - # ENV override - cfg_env = os.getenv("CONFIG_FILE") - if cfg_env and Path(cfg_env).exists(): - return Path(cfg_env) + Find config.yml using canonical path from config module. - # Common locations (container vs repo root) - candidates = [Path("config.yml"), Path("/app/config.yml")] + DEPRECATED: Use advanced_omi_backend.config.get_config_yml_path() directly. + Kept for backward compatibility. - # Also walk up from current file's parents defensively - try: - for parent in Path(__file__).resolve().parents: - c = parent / "config.yml" - if c.exists(): - return c - except Exception: - pass - - for c in candidates: - if c.exists(): - return c - - # Last resort: return /app/config.yml path (may not exist yet) - return Path("/app/config.yml") + Returns: + Path to config.yml + """ + from advanced_omi_backend.config import get_config_yml_path + return get_config_yml_path() def load_models_config(force_reload: bool = False) -> Optional[AppModels]: - """Load model configuration from config.yml. - - This function loads and parses the config.yml file, resolves environment - variables, validates model definitions using Pydantic, and caches the result. - + """Load model configuration from merged defaults.yml + config.yml. + + This function loads defaults.yml and config.yml, merges them with user overrides, + resolves environment variables, validates model definitions using Pydantic, and caches the result. + Args: force_reload: If True, reload from disk even if already cached - + Returns: AppModels instance with validated configuration, or None if config not found - + Raises: ValidationError: If config.yml has invalid model definitions yaml.YAMLError: If config.yml has invalid YAML syntax @@ -306,16 +286,18 @@ def load_models_config(force_reload: bool = False) -> Optional[AppModels]: if _REGISTRY is not None and not force_reload: return _REGISTRY - cfg_path = _find_config_path() - if not cfg_path.exists(): - return None - - # Load and parse YAML - with cfg_path.open("r") as f: - raw = yaml.safe_load(f) or {} - - # Resolve environment variables - raw = _deep_resolve_env(raw) + # Try to get merged configuration (defaults + user config) + try: + raw = get_config(force_reload=force_reload) + except Exception as e: + logging.error(f"Failed to load merged configuration: {e}") + # Fallback to direct config.yml loading + cfg_path = _find_config_path() + if not cfg_path.exists(): + return None + with cfg_path.open("r") as f: + raw = yaml.safe_load(f) or {} + raw = _deep_resolve_env(raw) # Extract sections defaults = raw.get("defaults", {}) or {} diff --git a/backends/advanced/src/advanced_omi_backend/models/job.py b/backends/advanced/src/advanced_omi_backend/models/job.py index 763373d2..f2d85add 100644 --- a/backends/advanced/src/advanced_omi_backend/models/job.py +++ b/backends/advanced/src/advanced_omi_backend/models/job.py @@ -37,6 +37,7 @@ async def _ensure_beanie_initialized(): from advanced_omi_backend.models.conversation import Conversation from advanced_omi_backend.models.audio_chunk import AudioChunkDocument from advanced_omi_backend.models.user import User + from advanced_omi_backend.models.waveform import WaveformData from pymongo.errors import ConfigurationError # Get MongoDB URI from environment @@ -54,7 +55,7 @@ async def _ensure_beanie_initialized(): # Initialize Beanie await init_beanie( database=database, - document_models=[User, Conversation, AudioChunkDocument], + document_models=[User, Conversation, 
AudioChunkDocument, WaveformData],
         )
 
         _beanie_initialized = True
diff --git a/backends/advanced/src/advanced_omi_backend/models/waveform.py b/backends/advanced/src/advanced_omi_backend/models/waveform.py
new file mode 100644
index 00000000..caf6fd49
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/models/waveform.py
@@ -0,0 +1,47 @@
+"""
+Waveform visualization data model for conversations.
+
+This module provides the WaveformData model for storing pre-computed
+waveform visualization data, enabling the UI to display audio waveforms
+without real-time decoding.
+"""
+
+from datetime import datetime
+from typing import List, Optional
+
+from beanie import Document, Indexed
+from pydantic import Field
+
+
+class WaveformData(Document):
+    """Pre-computed waveform visualization for conversations."""
+
+    # Link to parent conversation
+    conversation_id: Indexed(str) = Field(
+        description="Parent conversation ID (one waveform per conversation)"
+    )
+
+    # Waveform amplitude data
+    samples: List[float] = Field(
+        description="Amplitude samples normalized to [-1.0, 1.0] range"
+    )
+    sample_rate: int = Field(
+        description="Samples per second (e.g., 10 = 1 sample per 100ms)"
+    )
+
+    # Metadata
+    duration_seconds: float = Field(description="Total audio duration in seconds")
+    created_at: datetime = Field(
+        default_factory=datetime.utcnow,
+        description="When this waveform was generated"
+    )
+    processing_time_seconds: Optional[float] = Field(
+        None,
+        description="Time taken to generate waveform"
+    )
+
+    class Settings:
+        name = "waveforms"
+        indexes = [
+            "conversation_id",  # Fast lookup by conversation
+        ]
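As a rough illustration of the new model, a sketch of storing and fetching one waveform document per conversation (all values hypothetical; assumes `init_beanie` has already registered `WaveformData`, as the `app_factory.py` change above does):

```python
from advanced_omi_backend.models.waveform import WaveformData

async def store_example_waveform() -> None:
    doc = WaveformData(
        conversation_id="conv_abc123",       # hypothetical conversation ID
        samples=[0.0, 0.4, -0.3, 0.8] * 25,  # amplitudes normalized to [-1.0, 1.0]
        sample_rate=10,                      # 10 samples per second of audio
        duration_seconds=10.0,               # 100 samples / 10 per second
    )
    await doc.insert()

    # Later: a single indexed lookup by conversation
    cached = await WaveformData.find_one(
        WaveformData.conversation_id == "conv_abc123"
    )
    assert cached is not None
```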
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index afa2906f..78231da6 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -7,8 +7,8 @@
 import io
 from typing import Optional
 
-from fastapi import APIRouter, Depends, File, HTTPException, Query, UploadFile
-from fastapi.responses import FileResponse, StreamingResponse
+from fastapi import APIRouter, Depends, File, HTTPException, Query, UploadFile, Request
+from fastapi.responses import FileResponse, StreamingResponse, Response
 
 from advanced_omi_backend.auth import current_superuser, current_active_user_optional, get_user_from_token_param
 from advanced_omi_backend.controllers import audio_controller
@@ -46,6 +46,7 @@ async def upload_audio_from_drive_folder(
 @router.get("/get_audio/{conversation_id}")
 async def get_conversation_audio(
     conversation_id: str,
+    request: Request,
     token: Optional[str] = Query(default=None, description="JWT token for audio element access"),
     current_user: Optional[User] = Depends(current_active_user_optional),
 ):
@@ -106,17 +107,60 @@
                 detail=f"Failed to reconstruct audio: {str(e)}"
             )
 
-    # Serve as WAV file
-    return StreamingResponse(
-        io.BytesIO(wav_data),
-        media_type="audio/wav",
-        headers={
-            "Content-Disposition": f"inline; filename={conversation_id}.wav",
-            "Content-Length": str(len(wav_data)),
-            "X-Audio-Source": "mongodb-chunks",
-            "X-Chunk-Count": str(conversation.audio_chunks_count or 0),
-        }
-    )
+    # Handle Range requests for seeking support
+    file_size = len(wav_data)
+    range_header = request.headers.get("range")
+
+    # If no Range header, return complete file
+    if not range_header:
+        return StreamingResponse(
+            io.BytesIO(wav_data),
+            media_type="audio/wav",
+            headers={
+                "Content-Disposition": f"inline; filename={conversation_id}.wav",
+                "Content-Length": str(file_size),
+                "Accept-Ranges": "bytes",
+                "X-Audio-Source": "mongodb-chunks",
+                "X-Chunk-Count": str(conversation.audio_chunks_count or 0),
+            }
+        )
+
+    # Parse Range header (e.g., "bytes=0-1023")
+    try:
+        range_str = range_header.replace("bytes=", "")
+        range_start, range_end = range_str.split("-")
+        range_start = int(range_start) if range_start else 0
+        range_end = int(range_end) if range_end else file_size - 1
+
+        # Clamp to valid bounds and reject unsatisfiable ranges
+        range_start = max(0, range_start)
+        range_end = min(file_size - 1, range_end)
+        if range_start > range_end:
+            # Start lies beyond the end of the file (or past the requested
+            # end); let the 416 handler below respond per RFC 7233
+            raise ValueError(f"Unsatisfiable range: {range_header}")
+        content_length = range_end - range_start + 1
+
+        # Extract requested byte range
+        range_data = wav_data[range_start:range_end + 1]
+
+        # Return 206 Partial Content with Range headers
+        return Response(
+            content=range_data,
+            status_code=206,
+            media_type="audio/wav",
+            headers={
+                "Content-Range": f"bytes {range_start}-{range_end}/{file_size}",
+                "Content-Length": str(content_length),
+                "Accept-Ranges": "bytes",
+                "Content-Disposition": f"inline; filename={conversation_id}.wav",
+                "X-Audio-Source": "mongodb-chunks",
+            }
+        )
+    except (ValueError, IndexError):
+        # Invalid or unsatisfiable Range header, return 416 Range Not Satisfiable
+        return Response(
+            status_code=416,
+            headers={
+                "Content-Range": f"bytes */{file_size}"
+            }
+        )
 
 
 @router.get("/stream_audio/{conversation_id}")
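A client-side sketch of the new seeking behavior (assumes `httpx` and a locally running backend; the URL prefix and token are placeholders, and the byte math assumes 16 kHz mono 16-bit WAV, i.e., a 44-byte header plus 32,000 bytes per second of PCM):

```python
import httpx

async def fetch_first_second(conversation_id: str, token: str) -> bytes:
    # Route prefix is a placeholder; the endpoint itself is get_audio/{conversation_id}
    url = f"http://localhost:8000/api/get_audio/{conversation_id}"
    headers = {"Range": "bytes=0-32043"}  # WAV header (44) + 1s of PCM (32000)
    async with httpx.AsyncClient() as client:
        resp = await client.get(url, params={"token": token}, headers=headers)
    assert resp.status_code == 206  # Partial Content
    assert resp.headers["Content-Range"].startswith("bytes 0-32043/")
    assert resp.headers["Accept-Ranges"] == "bytes"
    return resp.content
```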
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
index c529162d..3f48fe1c 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
@@ -28,9 +28,12 @@ async def close_current_conversation(
 
 
 @router.get("")
-async def get_conversations(current_user: User = Depends(current_active_user)):
+async def get_conversations(
+    include_deleted: bool = Query(False, description="Include soft-deleted conversations"),
+    current_user: User = Depends(current_active_user)
+):
     """Get conversations. Admins see all conversations, users see only their own."""
-    return await conversation_controller.get_conversations(current_user)
+    return await conversation_controller.get_conversations(current_user, include_deleted)
 
 
 @router.get("/{conversation_id}")
@@ -89,6 +92,79 @@ async def get_conversation_version_history(
     return await conversation_controller.get_conversation_version_history(conversation_id, current_user)
 
 
+@router.get("/{conversation_id}/waveform")
+async def get_conversation_waveform(
+    conversation_id: str,
+    current_user: User = Depends(current_active_user)
+):
+    """
+    Get or generate waveform visualization data for a conversation.
+
+    This endpoint implements lazy generation:
+    1. Check if waveform already exists in database
+    2. If exists, return cached version immediately
+    3. If not, generate synchronously and cache in database
+    4. Return waveform data
+
+    The waveform contains amplitude samples normalized to [-1.0, 1.0] range
+    for visualization in the UI without needing to decode audio chunks.
+
+    Returns:
+        - samples: List[float] - Amplitude samples normalized to [-1, 1]
+        - sample_rate: int - Samples per second (this endpoint requests 3)
+        - duration_seconds: float - Total audio duration
+    """
+    from fastapi import HTTPException
+    from advanced_omi_backend.models.conversation import Conversation
+    from advanced_omi_backend.models.waveform import WaveformData
+    from advanced_omi_backend.workers.waveform_jobs import generate_waveform_data
+
+    # Verify conversation exists and user has access
+    conversation = await Conversation.find_one(
+        Conversation.conversation_id == conversation_id
+    )
+
+    if not conversation:
+        raise HTTPException(status_code=404, detail="Conversation not found")
+
+    # Check ownership (admins can access all)
+    if not current_user.is_superuser and conversation.user_id != str(current_user.id):
+        raise HTTPException(status_code=403, detail="Access denied")
+
+    # Check for existing waveform in database
+    waveform = await WaveformData.find_one(
+        WaveformData.conversation_id == conversation_id
+    )
+
+    # If waveform exists, return cached version
+    if waveform:
+        logger.info(f"Returning cached waveform for conversation {conversation_id[:12]}")
+        return waveform.model_dump(exclude={"id", "revision_id"})
+
+    # Generate waveform on-demand
+    logger.info(f"Generating waveform on-demand for conversation {conversation_id[:12]}")
+
+    waveform_dict = await generate_waveform_data(
+        conversation_id=conversation_id,
+        sample_rate=3
+    )
+
+    if not waveform_dict.get("success"):
+        error_msg = waveform_dict.get("error", "Unknown error")
+        logger.error(f"Waveform generation failed: {error_msg}")
+        raise HTTPException(
+            status_code=500,
+            detail=f"Waveform generation failed: {error_msg}"
+        )
+
+    # Return generated waveform (already saved to database by generator)
+    return {
+        "samples": waveform_dict["samples"],
+        "sample_rate": waveform_dict["sample_rate"],
+        "duration_seconds": waveform_dict["duration_seconds"]
+    }
+
+
 @router.delete("/{conversation_id}")
 async def delete_conversation(
     conversation_id: str,
diff --git a/backends/advanced/src/advanced_omi_backend/services/audio_stream/aggregator.py b/backends/advanced/src/advanced_omi_backend/services/audio_stream/aggregator.py
index f31f7453..19b76874 100644
--- a/backends/advanced/src/advanced_omi_backend/services/audio_stream/aggregator.py
+++ b/backends/advanced/src/advanced_omi_backend/services/audio_stream/aggregator.py
@@ -107,24 +107,56 @@ async def get_combined_results(self, session_id: str) -> dict:
                 "provider": None
             }
 
-        # For streaming providers (Deepgram), use ONLY the latest final result
-        # Each is_final=true result supersedes interim results for the same speech segment
-        # The latest result contains the most accurate transcription with best timing/confidence
-        latest_result = results[-1]
+        # Combine ALL final results for cumulative speech detection
+        # Each result represents a sequential segment of speech
+        all_text = []
+        all_words = []
+        all_segments = []
+        total_confidence = 0.0
+        provider = None
+
+        for result in results:
+            # Accumulate text
+            text = result.get("text", "").strip()
+            if text:
+                all_text.append(text)
+
+            # Accumulate words with timing data
+            words = result.get("words", [])
+            if words:
+                all_words.extend(words)
+
+            # Accumulate segments
+            segments = result.get("segments", [])
+            if segments:
+                all_segments.extend(segments)
+
+            # Sum confidence for averaging
+            total_confidence += result.get("confidence", 0.0)
+
+            # Get provider from first result
+            if provider is None:
+                provider = result.get("provider")
+
+        # Calculate 
average confidence
+        avg_confidence = total_confidence / len(results) if results else 0.0
+
+        # Join all text segments with spaces
+        combined_text = " ".join(all_text)
 
         combined = {
-            "text": latest_result.get("text", ""),
-            "words": latest_result.get("words", []),
-            "segments": latest_result.get("segments", []),
-            "chunk_count": len(results),  # Track how many results were received
-            "total_confidence": latest_result.get("confidence", 0.0),
-            "provider": latest_result.get("provider")
+            "text": combined_text,
+            "words": all_words,
+            "segments": all_segments,
+            "chunk_count": len(results),
+            "total_confidence": avg_confidence,
+            "provider": provider
         }
 
         logger.info(
             f"🔤 TRANSCRIPT [AGGREGATOR] session={session_id}, "
             f"total_results={len(results)}, words={len(combined['words'])}, "
-            f"text=\"{combined['text']}\""
+            f"text_length={len(combined_text)} chars"
         )
 
         return combined
diff --git a/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py b/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
index 1fa06011..6ec4fad4 100644
--- a/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
+++ b/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
@@ -218,7 +218,7 @@ async def mark_websocket_disconnected(self, session_id: str):
 
     async def finalize_session(self, session_id: str):
         """
-        Mark session as finalizing and clean up buffer.
+        Mark session as finalizing, send end marker, and clean up buffer.
 
         Args:
             session_id: Session identifier
@@ -230,8 +230,29 @@
             "finalized_at": str(time.time())
         })
 
-        # Clean up session buffer
+        # Send end_marker to Redis stream so streaming consumer can close the connection
         if session_id in self.session_buffers:
+            buffer = self.session_buffers[session_id]
+            stream_name = buffer["stream_name"]
+
+            # Send end_marker message to signal stream end
+            end_marker_data = {
+                b"end_marker": b"true",
+                b"session_id": session_id.encode(),
+                b"user_id": buffer["user_id"].encode(),
+                b"client_id": buffer["client_id"].encode(),
+                b"timestamp": str(time.time()).encode(),
+            }
+
+            await self.redis_client.xadd(
+                stream_name,
+                end_marker_data,
+                maxlen=25000,
+                approximate=True
+            )
+            logger.info(f"📡 Sent end_marker to {stream_name} for session {session_id}")
+
+            # Clean up session buffer
             del self.session_buffers[session_id]
             logger.debug(f"🧹 Cleaned up buffer for session {session_id}")
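On the consumer side, a minimal sketch (stream and field names as used above; the consumer loop itself is assumed and not part of this diff) of detecting the end marker and closing out a session:

```python
import redis.asyncio as redis

async def consume_until_end(stream_name: str) -> None:
    client = redis.Redis()
    last_id = "0-0"
    while True:
        # Block up to 5s waiting for new entries on the session's stream
        response = await client.xread({stream_name: last_id}, count=100, block=5000)
        for _stream, messages in response:
            for message_id, fields in messages:
                last_id = message_id
                if fields.get(b"end_marker") == b"true":
                    return  # producer finalized the session; stop consuming
                # ... otherwise handle the audio payload carried in `fields` ...
```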
diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/README.md b/backends/advanced/src/advanced_omi_backend/services/memory/README.md
index 1a1cad3b..ba6de6a4 100644
--- a/backends/advanced/src/advanced_omi_backend/services/memory/README.md
+++ b/backends/advanced/src/advanced_omi_backend/services/memory/README.md
@@ -448,11 +448,11 @@ OPENAI_API_KEY=your_openai_key
 OPENAI_BASE_URL=https://api.openai.com/v1
 OLLAMA_BASE_URL=http://localhost:11434
 
-# Vector Store Configuration 
+# Vector Store Configuration
 VECTOR_STORE_PROVIDER=qdrant
 QDRANT_BASE_URL=localhost
 QDRANT_PORT=6333
-QDRANT_COLLECTION_NAME=omi_memories
+QDRANT_COLLECTION_NAME=chronicle_memories
 
 # Memory Service Settings
 MEMORY_EXTRACTION_ENABLED=true
diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/base.py b/backends/advanced/src/advanced_omi_backend/services/memory/base.py
index e88e42d4..4abdb5b0 100644
--- a/backends/advanced/src/advanced_omi_backend/services/memory/base.py
+++ b/backends/advanced/src/advanced_omi_backend/services/memory/base.py
@@ -25,17 +25,18 @@
 @dataclass
 class MemoryEntry:
     """Represents a memory entry with content, metadata, and embeddings.
-    
+
     This is the core data structure used throughout the memory service
     for storing and retrieving user memories.
-    
+
     Attributes:
         id: Unique identifier for the memory
         content: The actual memory text/content
         metadata: Additional metadata (user_id, source, timestamps, etc.)
         embedding: Vector embedding for semantic search (optional)
-        score: Similarity score from search operations (optional) 
+        score: Similarity score from search operations (optional)
         created_at: Timestamp when memory was created
+        updated_at: Timestamp when memory was last updated
     """
     id: str
     content: str
@@ -43,11 +44,15 @@
     embedding: Optional[List[float]] = None
     score: Optional[float] = None
     created_at: Optional[str] = None
-    
+    updated_at: Optional[str] = None
+
     def __post_init__(self):
-        """Set created_at timestamp if not provided."""
+        """Set created_at and updated_at timestamps if not provided."""
+        current_time = str(int(time.time()))
         if self.created_at is None:
-            self.created_at = str(int(time.time()))
+            self.created_at = current_time
+        if self.updated_at is None:
+            self.updated_at = self.created_at  # Default to created_at, not current_time
 
     def to_dict(self) -> Dict[str, Any]:
         """Convert MemoryEntry to dictionary for JSON serialization."""
@@ -59,6 +64,7 @@
             "embedding": self.embedding,
             "score": self.score,
             "created_at": self.created_at,
+            "updated_at": self.updated_at,
             "user_id": self.metadata.get("user_id")  # Extract user_id from metadata
         }
 
diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/config.py b/backends/advanced/src/advanced_omi_backend/services/memory/config.py
index e48b8fb5..19b47bd7 100644
--- a/backends/advanced/src/advanced_omi_backend/services/memory/config.py
+++ b/backends/advanced/src/advanced_omi_backend/services/memory/config.py
@@ -65,22 +65,27 @@ class MemoryConfig:
 
 
 def load_config_yml() -> Dict[str, Any]:
-    """Load config.yml from standard locations."""
-    # Check /app/config.yml (Docker) or root relative to file
-    current_dir = Path(__file__).parent.resolve()
-    # Path inside Docker: /app/config.yml (if mounted) or ../../../config.yml relative to src
-    paths = [
-        Path("/app/config.yml"),
-        current_dir.parent.parent.parent.parent.parent / "config.yml",  # Relative to src/
-        Path("./config.yml"),
-    ]
+    """
+    Load config.yml using canonical path from config module.
+
+    Returns:
+        Loaded config.yml as dictionary
+
+    Raises:
+        FileNotFoundError: If config.yml does not exist
+    """
+    from advanced_omi_backend.config import get_config_yml_path
+
+    config_path = get_config_yml_path()
 
-    for path in paths:
-        if path.exists():
-            with open(path, "r") as f:
-                return yaml.safe_load(f) or {}
+    if not config_path.exists():
+        raise FileNotFoundError(
+            f"config.yml not found at {config_path}. "
+            "Ensure config directory is mounted correctly."
+ ) - raise FileNotFoundError(f"config.yml not found in any of: {[str(p) for p in paths]}") + with open(config_path, "r") as f: + return yaml.safe_load(f) or {} def create_openmemory_config( @@ -135,7 +140,7 @@ def create_openai_config( def create_qdrant_config( host: str = "localhost", port: int = 6333, - collection_name: str = "omi_memories", + collection_name: str = "chronicle_memories", embedding_dims: int = 1536, ) -> Dict[str, Any]: """Create Qdrant vector store configuration.""" @@ -258,7 +263,7 @@ def build_memory_config_from_env() -> MemoryConfig: host = str(vs_def.model_params.get("host", "qdrant")) port = int(vs_def.model_params.get("port", 6333)) - collection_name = str(vs_def.model_params.get("collection_name", "omi_memories")) + collection_name = str(vs_def.model_params.get("collection_name", "chronicle_memories")) vector_store_config = create_qdrant_config( host=host, port=port, diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/providers/chronicle.py b/backends/advanced/src/advanced_omi_backend/services/memory/providers/chronicle.py index 3fb96f00..fa73c526 100644 --- a/backends/advanced/src/advanced_omi_backend/services/memory/providers/chronicle.py +++ b/backends/advanced/src/advanced_omi_backend/services/memory/providers/chronicle.py @@ -277,12 +277,12 @@ async def get_all_memories(self, user_id: str, limit: int = 100) -> List[MemoryE async def count_memories(self, user_id: str) -> Optional[int]: """Count total number of memories for a user. - + Uses the vector store's native count capabilities. - + Args: user_id: User identifier - + Returns: Total count of memories for the user, or None if not supported """ @@ -297,6 +297,30 @@ async def count_memories(self, user_id: str) -> Optional[int]: memory_logger.error(f"Count memories failed: {e}") return None + async def get_memory(self, memory_id: str, user_id: Optional[str] = None) -> Optional[MemoryEntry]: + """Get a specific memory by ID. + + Args: + memory_id: Unique identifier of the memory to retrieve + user_id: Optional user ID for authentication/filtering + + Returns: + MemoryEntry object if found, None otherwise + """ + if not self._initialized: + await self.initialize() + + try: + memory = await self.vector_store.get_memory(memory_id, user_id) + if memory: + memory_logger.info(f"๐Ÿ“„ Retrieved memory {memory_id}") + else: + memory_logger.debug(f"Memory {memory_id} not found") + return memory + except Exception as e: + memory_logger.error(f"Get memory failed: {e}") + return None + async def delete_memory(self, memory_id: str, user_id: Optional[str] = None, user_email: Optional[str] = None) -> bool: """Delete a specific memory by ID. 
@@ -418,7 +442,8 @@ def _create_memory_entries( List of MemoryEntry objects ready for storage """ memory_entries = [] - + current_time = str(int(time.time())) + for memory_text, embedding in zip(fact_memories_text, embeddings): memory_id = str(uuid.uuid4()) memory_entries.append( @@ -435,10 +460,11 @@ def _create_memory_entries( "extraction_enabled": self.config.extraction_enabled, }, embedding=embedding, - created_at=str(int(time.time())), + created_at=current_time, + updated_at=current_time, ) ) - + return memory_entries async def _process_memory_updates( @@ -633,15 +659,17 @@ async def _apply_memory_actions( if emb is None: memory_logger.warning(f"Skipping ADD action due to missing embedding: {action_text}") continue - + memory_id = str(uuid.uuid4()) + current_time = str(int(time.time())) memory_entries.append( MemoryEntry( id=memory_id, content=action_text, metadata=base_metadata, embedding=emb, - created_at=str(int(time.time())), + created_at=current_time, + updated_at=current_time, ) ) memory_logger.info(f"โž• Added new memory: {memory_id} - {action_text[:50]}...") diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/providers/mycelia.py b/backends/advanced/src/advanced_omi_backend/services/memory/providers/mycelia.py index 6ace9ad6..6289f035 100644 --- a/backends/advanced/src/advanced_omi_backend/services/memory/providers/mycelia.py +++ b/backends/advanced/src/advanced_omi_backend/services/memory/providers/mycelia.py @@ -190,6 +190,7 @@ def _mycelia_object_to_memory_entry(self, obj: Dict, user_id: str) -> MemoryEntr content=memory_content, metadata=metadata, created_at=self._extract_bson_date(obj.get("createdAt")), + updated_at=self._extract_bson_date(obj.get("updatedAt")), ) async def _call_resource(self, action: str, jwt_token: str, **params) -> Dict[str, Any]: diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/providers/openmemory_mcp.py b/backends/advanced/src/advanced_omi_backend/services/memory/providers/openmemory_mcp.py index 2fe34164..510dd019 100644 --- a/backends/advanced/src/advanced_omi_backend/services/memory/providers/openmemory_mcp.py +++ b/backends/advanced/src/advanced_omi_backend/services/memory/providers/openmemory_mcp.py @@ -478,19 +478,24 @@ def _mcp_result_to_memory_entry(self, mcp_result: Dict[str, Any], user_id: str) # Extract similarity score if available (for search results) score = mcp_result.get('score') or mcp_result.get('similarity') or mcp_result.get('relevance') - - # Extract timestamp + + # Extract timestamps created_at = mcp_result.get('created_at') or mcp_result.get('timestamp') or mcp_result.get('date') if created_at is None: created_at = str(int(time.time())) - + + updated_at = mcp_result.get('updated_at') or mcp_result.get('modified_at') + if updated_at is None: + updated_at = str(created_at) # Default to created_at if not provided + return MemoryEntry( id=memory_id, content=content, metadata=metadata, embedding=None, # OpenMemory MCP server handles embeddings internally score=score, - created_at=str(created_at) + created_at=str(created_at), + updated_at=str(updated_at) ) except Exception as e: diff --git a/backends/advanced/src/advanced_omi_backend/services/memory/providers/vector_stores.py b/backends/advanced/src/advanced_omi_backend/services/memory/providers/vector_stores.py index 85ee200a..9fed0126 100644 --- a/backends/advanced/src/advanced_omi_backend/services/memory/providers/vector_stores.py +++ b/backends/advanced/src/advanced_omi_backend/services/memory/providers/vector_stores.py @@ -123,26 
+123,28 @@ async def add_memories(self, memories: List[MemoryEntry]) -> List[str]: points = [] for memory in memories: if memory.embedding: + current_time = str(int(time.time())) point = PointStruct( id=memory.id, vector=memory.embedding, payload={ "content": memory.content, "metadata": memory.metadata, - "created_at": memory.created_at or str(int(time.time())) + "created_at": memory.created_at or current_time, + "updated_at": memory.updated_at or current_time } ) points.append(point) - + if points: await self.client.upsert( collection_name=self.collection_name, points=points ) return [str(point.id) for point in points] - + return [] - + except Exception as e: memory_logger.error(f"Qdrant add memories failed: {e}") return [] @@ -190,7 +192,8 @@ async def search_memories(self, query_embedding: List[float], user_id: str, limi metadata=result.payload.get("metadata", {}), # Qdrant returns similarity scores directly (higher = more similar) score=result.score if result.score is not None else None, - created_at=result.payload.get("created_at") + created_at=result.payload.get("created_at"), + updated_at=result.payload.get("updated_at") ) memories.append(memory) # Log similarity scores for debugging @@ -230,10 +233,11 @@ async def get_memories(self, user_id: str, limit: int) -> List[MemoryEntry]: id=str(point.id), content=point.payload.get("content", ""), metadata=point.payload.get("metadata", {}), - created_at=point.payload.get("created_at") + created_at=point.payload.get("created_at"), + updated_at=point.payload.get("updated_at") ) memories.append(memory) - + return memories except Exception as e: @@ -356,29 +360,91 @@ async def update_memory( async def count_memories(self, user_id: str) -> int: """Count total number of memories for a user in Qdrant using native count API.""" try: - + search_filter = Filter( must=[ FieldCondition( - key="metadata.user_id", + key="metadata.user_id", match=MatchValue(value=user_id) ) ] ) - + # Use Qdrant's native count API (documented in qdrant/qdrant/docs) # Count operation: CountPoints -> CountResponse with count result result = await self.client.count( collection_name=self.collection_name, count_filter=search_filter ) - + return result.count - + except Exception as e: memory_logger.error(f"Qdrant count memories failed: {e}") return 0 + async def get_memory(self, memory_id: str, user_id: Optional[str] = None) -> Optional[MemoryEntry]: + """Get a specific memory by ID from Qdrant. 
+ + Args: + memory_id: Unique identifier of the memory to retrieve + user_id: Optional user ID for validation (not used in Qdrant filtering) + + Returns: + MemoryEntry object if found, None otherwise + """ + try: + # Convert memory_id to proper format for Qdrant + import uuid + try: + # Try to parse as UUID first + uuid.UUID(memory_id) + point_id = memory_id + except ValueError: + # If not a UUID, try as integer + try: + point_id = int(memory_id) + except ValueError: + # If neither UUID nor integer, use it as-is + point_id = memory_id + + # Retrieve the point by ID + points = await self.client.retrieve( + collection_name=self.collection_name, + ids=[point_id], + with_payload=True, + with_vectors=False + ) + + if not points: + memory_logger.debug(f"Memory not found: {memory_id}") + return None + + point = points[0] + + # If user_id is provided, validate ownership + if user_id: + point_user_id = point.payload.get("metadata", {}).get("user_id") + if point_user_id != user_id: + memory_logger.warning(f"Memory {memory_id} does not belong to user {user_id}") + return None + + # Convert to MemoryEntry + memory = MemoryEntry( + id=str(point.id), + content=point.payload.get("content", ""), + metadata=point.payload.get("metadata", {}), + created_at=point.payload.get("created_at"), + updated_at=point.payload.get("updated_at") + ) + + memory_logger.debug(f"Retrieved memory {memory_id}") + return memory + + except Exception as e: + memory_logger.error(f"Qdrant get memory failed for {memory_id}: {e}") + return None + diff --git a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py index f481ac3f..45773432 100644 --- a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py +++ b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py @@ -132,7 +132,7 @@ async def transcribe(self, audio_data: bytes, sample_rate: int, diarize: bool = channels = data["results"]["channels"] if channels and "alternatives" in channels[0]: alt = channels[0]["alternatives"][0] - logger.info(f"DEBUG Registry: Deepgram alternative keys: {list(alt.keys())}") + logger.debug(f"DEBUG Registry: Deepgram alternative keys: {list(alt.keys())}") # Extract normalized shape text, words, segments = "", [], [] @@ -143,10 +143,42 @@ async def transcribe(self, audio_data: bytes, sample_rate: int, diarize: bool = segments = _dotted_get(data, extract.get("segments")) or [] # DEBUG: Log what we extracted - logger.info(f"DEBUG Registry: Extracted {len(segments)} segments from response") + logger.debug(f"DEBUG Registry: Extracted {len(segments)} segments from response") if segments and len(segments) > 0: - logger.info(f"DEBUG Registry: First segment keys: {list(segments[0].keys()) if isinstance(segments[0], dict) else 'not a dict'}") - logger.info(f"DEBUG Registry: First segment: {segments[0]}") + logger.debug(f"DEBUG Registry: First segment keys: {list(segments[0].keys()) if isinstance(segments[0], dict) else 'not a dict'}") + logger.debug(f"DEBUG Registry: First segment: {segments[0]}") + + # FIX: Normalize Deepgram segment structure + provider = self.model.model_provider.lower() if self.model.model_provider else "" + if provider == "deepgram" and segments: + normalized_segments = [] + for seg in segments: + # Deepgram segments may have nested structure + # Extract text from either 'text' or 'transcript' or 'sentences' + text_content = seg.get("text") or seg.get("transcript") or "" + + # Handle nested 
sentences structure + if not text_content and "sentences" in seg: + sentences = seg.get("sentences", []) + text_content = " ".join([s.get("text", "") for s in sentences if s.get("text")]) + + # Skip empty segments + if not text_content or not text_content.strip(): + logger.debug(f"Skipping empty Deepgram segment: {seg}") + continue + + # Build normalized segment + normalized_seg = { + "text": text_content.strip(), + "start": seg.get("start", 0.0), + "end": seg.get("end", 0.0), + "speaker": seg.get("speaker", "SPEAKER_00"), + "confidence": seg.get("confidence", 1.0) + } + normalized_segments.append(normalized_seg) + + segments = normalized_segments + logger.debug(f"Normalized {len(segments)} Deepgram segments") return {"text": text, "words": words, "segments": segments} diff --git a/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py b/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py index 7d91495c..2c5e06ed 100644 --- a/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py +++ b/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py @@ -395,6 +395,154 @@ async def reconstruct_wav_from_conversation( return wav_data +async def reconstruct_audio_segments( + conversation_id: str, + segment_duration: float = 900.0, # 15 minutes + overlap: float = 30.0, # 30 seconds overlap for continuity +): + """ + Reconstruct audio from MongoDB chunks in time-bounded segments. + + This function yields audio segments from a conversation, allowing + processing of large files without loading everything into memory. + + Args: + conversation_id: Parent conversation ID + segment_duration: Duration of each segment in seconds (default: 900 = 15 minutes) + overlap: Overlap between segments in seconds (default: 30) + + Yields: + Tuple of (wav_bytes, start_time, end_time) for each segment + + Example: + >>> # Process 73-minute conversation in 15-minute chunks + >>> async for wav_data, start, end in reconstruct_audio_segments(conv_id): + ... # Process segment (only ~27 MB in memory at a time) + ... result = await process_segment(wav_data, start, end) + + Note: + Overlap is added to all segments except the final one, to ensure + speaker continuity across segment boundaries. Overlapping regions + should be merged during post-processing. 
+ """ + from advanced_omi_backend.models.conversation import Conversation + + # Get conversation metadata + conversation = await Conversation.get(conversation_id) + + if not conversation: + raise ValueError(f"Conversation {conversation_id} not found") + + total_duration = conversation.audio_total_duration or 0.0 + + if total_duration == 0: + logger.warning(f"Conversation {conversation_id} has zero duration, no segments to yield") + return + + # Get audio format from first chunk + first_chunk = await AudioChunkDocument.find_one( + AudioChunkDocument.conversation_id == conversation_id + ) + + if not first_chunk: + raise ValueError(f"No audio chunks found for conversation {conversation_id}") + + sample_rate = first_chunk.sample_rate + channels = first_chunk.channels + + # Calculate segment boundaries + start_time = 0.0 + + while start_time < total_duration: + # Calculate segment end time with overlap + end_time = min(start_time + segment_duration + overlap, total_duration) + + # Get chunks that overlap with this time range + # Note: Using start_time and end_time fields from chunks + chunks = await AudioChunkDocument.find( + AudioChunkDocument.conversation_id == conversation_id, + AudioChunkDocument.start_time < end_time, # Chunk starts before segment ends + AudioChunkDocument.end_time > start_time, # Chunk ends after segment starts + ).sort(+AudioChunkDocument.chunk_index).to_list() + + if not chunks: + logger.warning( + f"No chunks found for time range {start_time:.1f}s - {end_time:.1f}s " + f"in conversation {conversation_id[:8]}..." + ) + start_time += segment_duration + continue + + # Decode and concatenate chunks + pcm_data = await concatenate_chunks_to_pcm(chunks) + + # Build WAV file for this segment + wav_bytes = await build_wav_from_pcm( + pcm_data=pcm_data, + sample_rate=sample_rate, + channels=channels, + ) + + logger.info( + f"Yielding segment for {conversation_id[:8]}...: " + f"{start_time:.1f}s - {end_time:.1f}s " + f"({len(chunks)} chunks, {len(wav_bytes)} bytes)" + ) + + yield (wav_bytes, start_time, end_time) + + # Move to next segment (no overlap on the starting edge) + start_time += segment_duration + + +def filter_transcript_by_time( + transcript_data: dict, + start_time: float, + end_time: float +) -> dict: + """ + Filter transcript data to only include words within a time range. 
+ + Args: + transcript_data: Dict with 'text' and 'words' keys + start_time: Start time in seconds + end_time: End time in seconds + + Returns: + Filtered transcript data with only words in time range + + Example: + >>> transcript = {"text": "full text", "words": [...100 words...]} + >>> segment = filter_transcript_by_time(transcript, 0.0, 900.0) # First 15 minutes + >>> # segment contains only words from 0-900 seconds + """ + if not transcript_data or "words" not in transcript_data: + return transcript_data + + words = transcript_data.get("words", []) + + if not words: + return transcript_data + + # Filter words by time range + filtered_words = [] + for word in words: + word_start = word.get("start", 0) + word_end = word.get("end", 0) + + # Include word if it overlaps with the time range + if word_start < end_time and word_end > start_time: + filtered_words.append(word) + + # Rebuild text from filtered words + filtered_text = " ".join(word.get("word", "") for word in filtered_words) + + return { + "text": filtered_text, + "words": filtered_words + } + + async def convert_audio_to_chunks( conversation_id: str, audio_data: bytes, @@ -420,6 +568,9 @@ async def convert_audio_to_chunks( Returns: Number of chunks created + Raises: + ValueError: If audio duration exceeds 30 minutes + Example: >>> # Convert from memory without disk write >>> num_chunks = await convert_audio_to_chunks( @@ -436,11 +587,22 @@ async def convert_audio_to_chunks( logger.info(f"๐Ÿ“ฆ Converting audio to MongoDB chunks: {len(audio_data)} bytes PCM") - # Calculate chunk size in bytes + # Calculate audio duration and validate maximum limit bytes_per_second = sample_rate * sample_width * channels + total_duration_seconds = len(audio_data) / bytes_per_second + MAX_DURATION_SECONDS = 1800 # 30 minutes (180 chunks @ 10s each) + + if total_duration_seconds > MAX_DURATION_SECONDS: + raise ValueError( + f"Audio duration ({total_duration_seconds:.1f}s) exceeds maximum allowed " + f"({MAX_DURATION_SECONDS}s / 30 minutes). Please split the file into smaller segments." 
+ ) + + # Calculate chunk size in bytes chunk_size_bytes = int(chunk_duration * bytes_per_second) - # Split into chunks and store + # Collect all chunks before batch insert + chunks_to_insert = [] chunk_index = 0 total_original_size = 0 total_compressed_size = 0 @@ -481,8 +643,8 @@ async def convert_audio_to_chunks( channels=channels, ) - # Save to MongoDB - await audio_chunk.insert() + # Add to batch + chunks_to_insert.append(audio_chunk) # Update stats total_original_size += len(chunk_pcm) @@ -491,23 +653,30 @@ async def convert_audio_to_chunks( offset = chunk_end logger.debug( - f"๐Ÿ’พ Saved chunk {chunk_index}: " + f"๐Ÿ’พ Prepared chunk {chunk_index}: " f"{len(chunk_pcm)} โ†’ {len(opus_data)} bytes" ) + # Batch insert all chunks to MongoDB (single database operation) + if chunks_to_insert: + await AudioChunkDocument.insert_many(chunks_to_insert) + logger.info( + f"โœ… Batch inserted {len(chunks_to_insert)} chunks to MongoDB " + f"({total_duration_seconds:.1f}s audio)" + ) + # Update conversation metadata conversation = await Conversation.find_one( Conversation.conversation_id == conversation_id ) if conversation: - total_duration = len(audio_data) / bytes_per_second compression_ratio = total_compressed_size / total_original_size if total_original_size > 0 else 0.0 - logger.info(f"๐Ÿ” DEBUG: Setting metadata - chunks={chunk_index}, duration={total_duration:.2f}s, ratio={compression_ratio:.3f}") + logger.info(f"๐Ÿ” DEBUG: Setting metadata - chunks={chunk_index}, duration={total_duration_seconds:.2f}s, ratio={compression_ratio:.3f}") conversation.audio_chunks_count = chunk_index - conversation.audio_total_duration = total_duration + conversation.audio_total_duration = total_duration_seconds conversation.audio_compression_ratio = compression_ratio logger.info(f"๐Ÿ” DEBUG: Before save - chunks={conversation.audio_chunks_count}, duration={conversation.audio_total_duration}") @@ -550,7 +719,7 @@ async def convert_wav_to_chunks( Raises: FileNotFoundError: If WAV file doesn't exist - ValueError: If WAV file is invalid + ValueError: If WAV file is invalid or exceeds 30 minutes Example: >>> # Convert uploaded file to chunks @@ -584,11 +753,22 @@ async def convert_wav_to_chunks( f"{sample_rate}Hz, {channels}ch, {sample_width*8}-bit" ) - # Calculate chunk size in bytes + # Calculate audio duration and validate maximum limit bytes_per_second = sample_rate * sample_width * channels + total_duration_seconds = len(pcm_data) / bytes_per_second + MAX_DURATION_SECONDS = 1800 # 30 minutes (180 chunks @ 10s each) + + if total_duration_seconds > MAX_DURATION_SECONDS: + raise ValueError( + f"Audio duration ({total_duration_seconds:.1f}s) exceeds maximum allowed " + f"({MAX_DURATION_SECONDS}s / 30 minutes). Please split the file into smaller segments." 
+        )
+
+    # Calculate chunk size in bytes
     chunk_size_bytes = int(chunk_duration * bytes_per_second)
 
-    # Split into chunks and store
+    # Collect all chunks before batch insert
+    chunks_to_insert = []
     chunk_index = 0
     total_original_size = 0
     total_compressed_size = 0
@@ -629,8 +809,8 @@ async def convert_wav_to_chunks(
             channels=channels,
         )
 
-        # Save to MongoDB
-        await audio_chunk.insert()
+        # Add to batch
+        chunks_to_insert.append(audio_chunk)
 
         # Update stats
         total_original_size += len(chunk_pcm)
@@ -639,23 +819,30 @@ async def convert_wav_to_chunks(
         offset = chunk_end
 
         logger.debug(
-            f"💾 Saved chunk {chunk_index}: "
+            f"💾 Prepared chunk {chunk_index}: "
             f"{len(chunk_pcm)} → {len(opus_data)} bytes"
         )
 
+    # Batch insert all chunks to MongoDB (single database operation)
+    if chunks_to_insert:
+        await AudioChunkDocument.insert_many(chunks_to_insert)
+        logger.info(
+            f"✅ Batch inserted {len(chunks_to_insert)} chunks to MongoDB "
+            f"({total_duration_seconds:.1f}s audio)"
+        )
+
     # Update conversation metadata
     conversation = await Conversation.find_one(
         Conversation.conversation_id == conversation_id
     )
     if conversation:
-        total_duration = len(pcm_data) / bytes_per_second
         compression_ratio = total_compressed_size / total_original_size if total_original_size > 0 else 0.0
 
-        logger.info(f"🔍 DEBUG: Setting metadata - chunks={chunk_index}, duration={total_duration:.2f}s, ratio={compression_ratio:.3f}")
+        logger.info(f"🔍 DEBUG: Setting metadata - chunks={chunk_index}, duration={total_duration_seconds:.2f}s, ratio={compression_ratio:.3f}")
 
         conversation.audio_chunks_count = chunk_index
-        conversation.audio_total_duration = total_duration
+        conversation.audio_total_duration = total_duration_seconds
         conversation.audio_compression_ratio = compression_ratio
 
         logger.info(f"🔍 DEBUG: Before save - chunks={conversation.audio_chunks_count}, duration={conversation.audio_total_duration}")
diff --git a/backends/advanced/src/advanced_omi_backend/workers/cleanup_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/cleanup_jobs.py
index e0229457..e470550d 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/cleanup_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/cleanup_jobs.py
@@ -10,6 +10,7 @@
 from advanced_omi_backend.models.conversation import Conversation
 from advanced_omi_backend.models.audio_chunk import AudioChunkDocument
+from advanced_omi_backend.models.waveform import WaveformData
 from advanced_omi_backend.models.job import async_job
 from advanced_omi_backend.config import load_cleanup_settings_from_file
 
@@ -29,7 +30,7 @@ async def purge_old_deleted_conversations(
         dry_run: If True, only count what would be deleted without actually deleting
 
     Returns:
-        Dict with counts of purged conversations and chunks
+        Dict with counts of purged conversations, chunks, and waveforms
     """
     # Get retention period from config if not specified
     if retention_days is None:
@@ -48,6 +49,7 @@ async def purge_old_deleted_conversations(
 
     purged_conversations = 0
     purged_chunks = 0
+    purged_waveforms = 0
 
     for conversation in old_deleted:
         conversation_id = conversation.conversation_id
@@ -59,13 +61,20 @@ async def purge_old_deleted_conversations(
             ).delete()
             purged_chunks += chunk_result.deleted_count
 
+            # Hard delete waveforms
+            waveform_result = await WaveformData.find(
+                WaveformData.conversation_id == conversation_id
+            ).delete()
+            purged_waveforms += waveform_result.deleted_count
+
             # Hard delete conversation
             await conversation.delete()
             purged_conversations += 1
 
             logger.info(
                 f"Purged conversation {conversation_id} "
-                f"(deleted {chunk_result.deleted_count} chunks)"
+                f"(deleted {chunk_result.deleted_count} chunks, "
+                f"{waveform_result.deleted_count} waveforms)"
             )
         else:
             # Dry run - just count
@@ -73,21 +82,29 @@ async def purge_old_deleted_conversations(
                 AudioChunkDocument.conversation_id == conversation_id
             ).count()
             purged_chunks += chunk_count
+
+            waveform_count = await WaveformData.find(
+                WaveformData.conversation_id == conversation_id
+            ).count()
+            purged_waveforms += waveform_count
+
             purged_conversations += 1
 
             logger.info(
                 f"[DRY RUN] Would purge conversation {conversation_id} "
-                f"(with {chunk_count} chunks)"
+                f"(with {chunk_count} chunks, {waveform_count} waveforms)"
             )
 
     logger.info(
         f"{'[DRY RUN] Would purge' if dry_run else 'Purged'} "
-        f"{purged_conversations} conversations and {purged_chunks} chunks"
+        f"{purged_conversations} conversations, {purged_chunks} chunks, "
+        f"and {purged_waveforms} waveforms"
    )
 
     return {
         "purged_conversations": purged_conversations,
         "purged_chunks": purged_chunks,
+        "purged_waveforms": purged_waveforms,
         "retention_days": retention_days,
         "cutoff_date": cutoff_date.isoformat(),
         "dry_run": dry_run,
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index e9e754bd..764144e5 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -353,7 +353,38 @@ async def open_conversation_job(
 
             # Extract speaker information from segments
             segments = combined.get("segments", [])
-            speakers = extract_speakers_from_segments(segments)
+
+            # FIX: Validate and filter segments before processing
+            validated_segments = []
+            for i, seg in enumerate(segments):
+                # Check if segment is a dict
+                if not isinstance(seg, dict):
+                    logger.warning(f"Segment {i} is not a dict: {type(seg)}")
+                    continue
+
+                # Check for required text field
+                text = seg.get("text", "").strip()
+                if not text:
+                    logger.debug(f"Segment {i} has no text, skipping")
+                    continue
+
+                # Check for reasonable timing
+                start = seg.get("start", 0.0)
+                end = seg.get("end", 0.0)
+                if end <= start:
+                    logger.debug(f"Segment {i} has invalid timing (start={start}, end={end}), correcting")
+                    # Auto-correct: estimate duration from text length
+                    estimated_duration = len(text.split()) * 0.5  # ~0.5 seconds per word
+                    seg["end"] = start + estimated_duration
+
+                # Ensure speaker field exists
+                if "speaker" not in seg or not seg["speaker"]:
+                    seg["speaker"] = "SPEAKER_00"
+
+                validated_segments.append(seg)
+
+            logger.info(f"Validated {len(validated_segments)}/{len(segments)} segments")
+            speakers = extract_speakers_from_segments(validated_segments)
 
             # Track new speech activity (word count based)
             new_speech_time, last_word_count = await track_speech_activity(
@@ -419,7 +450,7 @@ async def open_conversation_job(
                 if current_count > last_result_count:
                     logger.info(
                         f"📊 Conversation {conversation_id} progress: "
-                        f"{current_count} results, {len(combined['text'])} chars, {len(combined['segments'])} segments"
+                        f"{current_count} results, {len(combined['text'])} chars, {len(validated_segments)} segments"
                     )
                     last_result_count = current_count
@@ -435,7 +466,7 @@ async def open_conversation_job(
                 'transcript': transcript_text,
                 'segment_id': f"{session_id}_{current_count}",
                 'conversation_id': conversation_id,
-                'segments': combined.get('segments', []),
+                'segments': validated_segments,
                 'word_count': speech_analysis.get('word_count', 0),
             }
@@ -536,6 +567,36 @@ async def open_conversation_job(
             transcript_text = final_transcript.get("text", "")
             segments_data = final_transcript.get("segments", [])
 
+            # If streaming provider didn't provide segments (e.g., Deepgram streaming),
+            # create segments from individual final results with word-level data
+            if not segments_data:
+                logger.info(f"📝 No segments in streaming results, creating from word-level data")
+                results = await aggregator.get_session_results(session_id)
+
+                for result in results:
+                    words = result.get("words", [])
+                    text = result.get("text", "").strip()
+
+                    # Skip empty results or results without timing data.
+                    # WARNING: results without word-level timing are not supported;
+                    # ideally this would raise an error, but we skip them for now
+                    # so edge cases degrade gracefully.
+                    if not words or not text:
+                        continue
+
+                    # Create segment dict from this result chunk
+                    # Each "final" result becomes one segment with generic speaker label
+                    segment_dict = {
+                        "start": words[0]["start"],
+                        "end": words[-1]["end"],
+                        "text": text,
+                        "speaker": "SPEAKER_00",  # Generic label, updated by speaker recognition
+                        "confidence": result.get("confidence"),
+                        "words": words  # Already in correct format from aggregator
+                    }
+                    segments_data.append(segment_dict)
+
+                logger.info(f"✅ Created {len(segments_data)} segments from streaming results")
+
             # Convert segments to SpeakerSegment format with word-level timestamps
             segments = [
                 Conversation.SpeakerSegment(
@@ -566,7 +627,7 @@ async def open_conversation_job(
                 transcript=transcript_text,
                 segments=segments,
                 provider=provider,
-                model=provider_str,  # Provider name as model
+                model=provider,  # Provider name as model
                 processing_time_seconds=None,  # Not applicable for streaming
                 metadata={
                     "source": "streaming",
diff --git a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
index 3547674a..086b3ae1 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
@@ -15,6 +15,88 @@
 logger = logging.getLogger(__name__)
 
 
+def _merge_overlapping_speaker_segments(
+    segments: list[dict],
+    overlap: float
+) -> list[dict]:
+    """
+    Merge speaker segments from overlapping audio chunks.
+
+    This function handles segments that may overlap due to chunked processing,
+    merging segments from the same speaker and resolving conflicts using confidence scores.
+
+    Args:
+        segments: List of speaker segment dicts with start, end, text, speaker, confidence
+        overlap: Overlap duration in seconds used during chunking (informational
+            only; merging is driven by the segments' actual timestamps)
+
+    Returns:
+        Merged list of speaker segments
+
+    Example:
+        >>> segments = [
+        ...     {"start": 0, "end": 930, "speaker": "Alice", "text": "...", "confidence": 0.9},
+        ...     {"start": 900, "end": 1830, "speaker": "Alice", "text": "...", "confidence": 0.8},
+        ... ]
+        >>> merged = _merge_overlapping_speaker_segments(segments, overlap=30.0)
+        >>> # Returns single merged segment from Alice
+    """
+    if not segments:
+        return []
+
+    # Sort by start time
+    segments.sort(key=lambda s: s.get("start", 0))
+
+    merged = []
+    current = segments[0].copy()  # Copy to avoid mutating input
+
+    for next_seg in segments[1:]:
+        # Check if segments overlap
+        if next_seg["start"] < current["end"]:
+            # Overlapping - decide how to merge
+            if current.get("speaker") == next_seg.get("speaker"):
+                # Same speaker - merge by extending end time
+                current["end"] = max(current["end"], next_seg["end"])
+
+                # Combine text (avoid duplication in overlap region)
+                current_text = current.get("text", "")
+                next_text = next_seg.get("text", "")
+
+                # Simple text merging - just append if different
+                if next_text and next_text not in current_text:
+                    current["text"] = f"{current_text} {next_text}".strip()
+
+                # Use higher confidence
+                current["confidence"] = max(
+                    current.get("confidence", 0),
+                    next_seg.get("confidence", 0)
+                )
+            else:
+                # Different speakers - use confidence to decide boundary
+                current_conf = current.get("confidence", 0)
+                next_conf = next_seg.get("confidence", 0)
+
+                if next_conf > current_conf:
+                    # Next segment more confident, close current and start new
+                    merged.append(current)
+                    current = next_seg.copy()
+                else:
+                    # Current more confident, adjust next segment start
+                    # Save current, update next to start after current
+                    merged.append(current)
+                    next_seg_copy = next_seg.copy()
+                    next_seg_copy["start"] = current["end"]
+                    current = next_seg_copy
+        else:
+            # No overlap, save current and move to next
+            merged.append(current)
+            current = next_seg.copy()
+
+    # Don't forget last segment
+    merged.append(current)
+
+    return merged
+
+
 @async_job(redis=True, beanie=True)
 async def check_enrolled_speakers_job(
     session_id: str,
@@ -185,52 +267,130 @@ async def recognise_speakers_job(
         }
 
     # Reconstruct audio from MongoDB chunks
-    from advanced_omi_backend.utils.audio_chunk_utils import reconstruct_wav_from_conversation
+    from advanced_omi_backend.utils.audio_chunk_utils import (
+        reconstruct_wav_from_conversation,
+        reconstruct_audio_segments,
+        filter_transcript_by_time
+    )
+    import os
+
+    # Read transcript text and words from the transcript version
+    # (Parameters may be empty if called via job dependency)
+    actual_transcript_text = transcript_text or transcript_version.transcript or ""
+    actual_words = words if words else []
+
+    # If words not provided, we need to get them from metadata
+    if not actual_words and transcript_version.metadata:
+        actual_words = transcript_version.metadata.get("words", [])
+
+    if not actual_transcript_text:
+        logger.warning(f"🎤 No transcript text found in version {version_id}")
+        return {
+            "success": False,
+            "conversation_id": conversation_id,
+            "version_id": version_id,
+            "error": "No transcript text available",
+            "processing_time_seconds": 0
+        }
+
+    transcript_data = {
+        "text": actual_transcript_text,
+        "words": actual_words
+    }
+
+    # Check if we need to use chunked processing
+    total_duration = conversation.audio_total_duration or 0.0
+    chunk_threshold = float(os.getenv("SPEAKER_CHUNK_THRESHOLD", "1500"))  # 25 minutes default
 
     logger.info(f"📦 Reconstructing audio from MongoDB chunks for conversation {conversation_id}")
+    logger.info(f"📊 Total duration: {total_duration:.1f}s, Threshold: {chunk_threshold:.1f}s")
 
     # Call speaker recognition service
     try:
-        # Reconstruct WAV from MongoDB chunks (already in memory as bytes)
-        wav_data = await reconstruct_wav_from_conversation(conversation_id)
+        speaker_segments = []
+
+        if total_duration > chunk_threshold:
+            # Chunked processing for large files
+            logger.info(f"🎤 Using chunked processing for large file ({total_duration:.1f}s > {chunk_threshold:.1f}s)")
+
+            segment_duration = float(os.getenv("SPEAKER_CHUNK_SIZE", "900"))  # 15 minutes default
+            overlap = float(os.getenv("SPEAKER_CHUNK_OVERLAP", "30"))  # 30 seconds default
+
+            async for wav_data, start_time, end_time in reconstruct_audio_segments(
+                conversation_id=conversation_id,
+                segment_duration=segment_duration,
+                overlap=overlap
+            ):
+                logger.info(
+                    f"📦 Processing segment {start_time:.1f}s - {end_time:.1f}s: "
+                    f"{len(wav_data) / 1024 / 1024:.2f} MB"
+                )
 
-        logger.info(
-            f"📦 Reconstructed audio from MongoDB chunks: "
-            f"{len(wav_data) / 1024 / 1024:.2f} MB"
-        )
+                # Filter transcript for this time range
+                segment_transcript = filter_transcript_by_time(
+                    transcript_data,
+                    start_time,
+                    end_time
+                )
 
-        # Read transcript text and words from the transcript version
-        # (Parameters may be empty if called via job dependency)
-        actual_transcript_text = transcript_text or transcript_version.transcript or ""
-        actual_words = words if words else []
+                # Call speaker service for this segment
+                speaker_result = await speaker_client.diarize_identify_match(
+                    audio_data=wav_data,
+                    transcript_data=segment_transcript,
+                    user_id=user_id
+                )
 
-        # If words not provided, we need to get them from metadata
-        if not actual_words and transcript_version.metadata:
-            actual_words = transcript_version.metadata.get("words", [])
+                # Check for errors from speaker service
+                if speaker_result.get("error"):
+                    error_type = speaker_result.get("error")
+                    error_message = speaker_result.get("message", "Unknown error")
+                    logger.error(f"🎤 Speaker service error on segment {start_time:.1f}s: {error_type}")
 
-        if not actual_transcript_text:
-            logger.warning(f"🎤 No transcript text found in version {version_id}")
-            return {
-                "success": False,
-                "conversation_id": conversation_id,
-                "version_id": version_id,
-                "error": "No transcript text available",
-                "processing_time_seconds": 0
-            }
+                    # Raise exception for connection failures
+                    if error_type in ("connection_failed", "timeout", "client_error"):
+                        raise RuntimeError(f"Speaker recognition service unavailable: {error_type} - {error_message}")
 
-        transcript_data = {
-            "text": actual_transcript_text,
-            "words": actual_words
-        }
+                    # For processing errors, continue with other segments
+                    continue
+
+                # Adjust timestamps to global time and collect
+                if speaker_result and "segments" in speaker_result:
+                    for seg in speaker_result["segments"]:
+                        seg["start"] += start_time
+                        seg["end"] += start_time
+
+                    speaker_segments.extend(speaker_result["segments"])
 
-        logger.info(f"🎤 Calling speaker recognition service...")
+            logger.info(f"🎤 Collected {len(speaker_segments)} segments from chunked processing")
 
-        # Call speaker service with in-memory audio data (no temp file needed!)
-        speaker_result = await speaker_client.diarize_identify_match(
-            audio_data=wav_data,  # Pass bytes directly, no disk I/O
-            transcript_data=transcript_data,
-            user_id=user_id
-        )
+            # Merge overlapping segments
+            if speaker_segments:
+                speaker_segments = _merge_overlapping_speaker_segments(speaker_segments, overlap)
+                logger.info(f"🎤 After merging overlaps: {len(speaker_segments)} segments")
+
+            # Package as result dict for consistent handling below
+            speaker_result = {"segments": speaker_segments}
+
+        else:
+            # Normal processing for files <= threshold
+            logger.info(f"🎤 Using normal processing for small file ({total_duration:.1f}s <= {chunk_threshold:.1f}s)")
+
+            # Reconstruct WAV from MongoDB chunks (already in memory as bytes)
+            wav_data = await reconstruct_wav_from_conversation(conversation_id)
+
+            logger.info(
+                f"📦 Reconstructed audio from MongoDB chunks: "
+                f"{len(wav_data) / 1024 / 1024:.2f} MB"
+            )
+
+            logger.info(f"🎤 Calling speaker recognition service...")
+
+            # Call speaker service with in-memory audio data (no temp file needed!)
+            speaker_result = await speaker_client.diarize_identify_match(
+                audio_data=wav_data,  # Pass bytes directly, no disk I/O
+                transcript_data=transcript_data,
+                user_id=user_id
+            )
 
     except ValueError as e:
         # No chunks found for conversation
@@ -296,11 +456,19 @@ async def recognise_speakers_job(
     updated_segments = []
     empty_segment_count = 0
     for seg in speaker_segments:
-        segment_text = seg.get("text", "").strip()
+        # FIX: More robust empty segment detection
+        text = seg.get("text", "").strip()
+
+        # Skip segments with no text, whitespace-only, or very short
+        if not text or len(text) < 3:
+            empty_segment_count += 1
+            logger.debug(f"Filtered empty/short segment: text='{text}'")
+            continue
 
-        # Skip segments with no text
-        if not segment_text:
+        # Skip segments with invalid structure
+        if not isinstance(seg.get("start"), (int, float)) or not isinstance(seg.get("end"), (int, float)):
             empty_segment_count += 1
+            logger.debug(f"Filtered segment with invalid timing: {seg}")
             continue
 
         speaker_name = seg.get("identified_as") or seg.get("speaker", "Unknown")
@@ -308,7 +476,7 @@ async def recognise_speakers_job(
             Conversation.SpeakerSegment(
                 start=seg.get("start", 0),
                 end=seg.get("end", 0),
-                text=segment_text,
+                text=text,
                 speaker=speaker_name,
                 confidence=seg.get("confidence")
             )
diff --git a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
index 023426df..c8d3c76c 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
@@ -603,6 +603,7 @@ async def stream_speech_detection_job(
     # Track when session closes for graceful shutdown
     session_closed_at = None
     final_check_grace_period = 15  # Wait up to 15 seconds for final transcription after session closes
+    last_speech_analysis = None  # Track last analysis for detailed logging
 
     # Main loop: Listen for speech
     while True:
@@ -663,6 +664,7 @@ async def stream_speech_detection_job(
             )
 
             speech_analysis = analyze_speech(transcript_data)
+            last_speech_analysis = speech_analysis  # Track for final logging
 
             logger.info(
                 f"🔍 {speech_analysis.get('word_count', 0)} words, "
@@ -671,6 +673,7 @@ async def stream_speech_detection_job(
             )
 
             if not speech_analysis.get("has_speech", False):
+                logger.info(f"⏳ Waiting for more speech - {speech_analysis.get('reason', 'unknown reason')}")
                 await asyncio.sleep(2)
                 continue
@@ -847,11 +850,17 @@ async def stream_speech_detection_job(
         }
 
     # Session ended without speech
-    logger.info(f"✅ Session ended without speech")
+    reason = last_speech_analysis.get('reason', 'No transcription received') if last_speech_analysis else 'No transcription received'
+    logger.warning(
+        f"❌ Session ended without meaningful speech detected\n"
+        f"   Reason: {reason}\n"
+        f"   Runtime: {time.time() - start_time:.1f}s"
+    )
     return {
         "session_id": session_id,
         "user_id": user_id,
         "client_id": client_id,
         "no_speech_detected": True,
+        "reason": reason,
         "runtime_seconds": time.time() - start_time,
     }
diff --git a/backends/advanced/src/advanced_omi_backend/workers/waveform_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/waveform_jobs.py
new file mode 100644
index 00000000..911b651d
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/workers/waveform_jobs.py
@@ -0,0 +1,190 @@
+"""
+Waveform generation workers for audio visualization.
+
+This module provides async functions to generate waveform data from
+audio chunks stored in MongoDB. Waveforms are computed on-demand
+and cached for subsequent requests.
+"""
+
+import logging
+import struct
+import time
+from typing import Dict, Any, List
+
+logger = logging.getLogger(__name__)
+
+
+async def generate_waveform_data(
+    conversation_id: str,
+    sample_rate: int = 3,
+) -> Dict[str, Any]:
+    """
+    Generate waveform visualization data from conversation audio chunks.
+
+    This function:
+    1. Retrieves Opus-compressed audio chunks from MongoDB
+    2. Decodes each chunk to PCM
+    3. Downsamples PCM to target sample rate (e.g., 3 samples/sec)
+    4. Calculates amplitude peaks for each sample window
+    5. Normalizes to [0.0, 1.0] range
+    6. Stores in WaveformData collection
+
+    Args:
+        conversation_id: Conversation ID to generate waveform for
+        sample_rate: Samples per second for waveform (default: 3)
+
+    Returns:
+        Dict with:
+        - success: bool
+        - samples: List[float] (if successful)
+        - sample_rate: int (if successful)
+        - duration_seconds: float (if successful)
+        - error: str (if failed)
+    """
+    from advanced_omi_backend.models.waveform import WaveformData
+    from advanced_omi_backend.utils.audio_chunk_utils import (
+        retrieve_audio_chunks,
+        decode_opus_to_pcm,
+    )
+
+    start_time = time.time()
+    fetch_time = 0.0
+    decode_time = 0.0
+    waveform_gen_time = 0.0
+
+    try:
+        logger.info(f"🎵 Generating waveform for conversation {conversation_id[:12]}...
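+        # Backup bookkeeping (filled in by BackupManager.create_backup below)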
+        self.backup_size_bytes = 0
+        self.backup_path = None
+
+
+class BackupManager:
+    """Handle backup operations"""
+
+    def __init__(self, backup_dir: str, export_audio: bool, mongo_db: Any):
+        self.backup_dir = Path(backup_dir)
+        self.export_audio = export_audio
+        self.mongo_db = mongo_db
+        self.timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+        self.backup_path = self.backup_dir / f"backup_{self.timestamp}"
+
+    async def create_backup(
+        self,
+        qdrant_client: Optional[AsyncQdrantClient],
+        stats: CleanupStats
+    ) -> bool:
+        """Create complete backup of all data"""
+        try:
+            logger.info(f"Creating backup at {self.backup_path}")
+            self.backup_path.mkdir(parents=True, exist_ok=True)
+            stats.backup_path = str(self.backup_path)
+
+            # Export MongoDB data
+            await self._export_conversations(stats)
+            await self._export_audio_chunks_metadata(stats)
+            await self._export_waveforms(stats)
+            await self._export_chat_sessions(stats)
+            await self._export_chat_messages(stats)
+
+            # Export audio as WAV if requested
+            if self.export_audio:
+                await self._export_audio_wav(stats)
+
+            # Export Qdrant vectors
+            if qdrant_client:
+                await self._export_memories(qdrant_client, stats)
+
+            # Generate summary
+            await self._generate_summary(stats)
+
+            # Calculate backup size
+            stats.backup_size_bytes = sum(
+                f.stat().st_size for f in self.backup_path.rglob('*') if f.is_file()
+            )
+
+            logger.info(f"Backup completed: {stats.backup_size_bytes / (1024**2):.2f} MB")
+            return True
+
+        except Exception as e:
+            logger.error(f"Backup failed: {e}", exc_info=True)
+            return False
+
+    async def _export_conversations(self, stats: CleanupStats):
+        """Export all conversations to JSON"""
+        logger.info("Exporting conversations...")
+        conversations = await Conversation.find_all().to_list()
+        stats.conversations_count = len(conversations)
+
+        # Serialize conversations (handle datetime, UUID, etc.)
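+        # model_dump(mode='json') renders datetime/ObjectId fields as strings;
+        # json.dump's default=str below is a fallback for anything it misses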
+        conversations_data = []
+        for conv in conversations:
+            conv_dict = conv.model_dump(mode='json')
+            conversations_data.append(conv_dict)
+
+        output_path = self.backup_path / "conversations.json"
+        with open(output_path, 'w') as f:
+            json.dump(conversations_data, f, indent=2, default=str)
+
+        logger.info(f"Exported {stats.conversations_count} conversations")
+
+    async def _export_audio_chunks_metadata(self, stats: CleanupStats):
+        """Export audio chunks metadata (not the actual audio)"""
+        logger.info("Exporting audio chunks metadata...")
+
+        # Use raw MongoDB query to handle malformed documents
+        # (some old/corrupted chunks may not validate against current schema)
+        audio_chunks_collection = self.mongo_db["audio_chunks"]
+        chunks_cursor = audio_chunks_collection.find({})
+
+        chunks_data = []
+        malformed_count = 0
+
+        async for chunk in chunks_cursor:
+            try:
+                # Extract fields safely with defaults for missing values
+                chunk_dict = {
+                    'conversation_id': chunk.get('conversation_id'),
+                    'chunk_index': chunk.get('chunk_index'),
+                    'start_time': chunk.get('start_time'),
+                    'end_time': chunk.get('end_time'),
+                    'duration': chunk.get('duration'),
+                    'original_size': chunk.get('original_size'),
+                    'compressed_size': chunk.get('compressed_size'),
+                    'sample_rate': chunk.get('sample_rate', 16000),
+                    'channels': chunk.get('channels', 1),
+                    'has_speech': chunk.get('has_speech'),
+                    'created_at': str(chunk.get('created_at', ''))
+                }
+                chunks_data.append(chunk_dict)
+            except Exception as e:
+                malformed_count += 1
+                logger.warning(f"Skipping malformed chunk {chunk.get('_id')}: {e}")
+                continue
+
+        stats.audio_chunks_count = len(chunks_data)
+
+        output_path = self.backup_path / "audio_chunks_metadata.json"
+        with open(output_path, 'w') as f:
+            json.dump(chunks_data, f, indent=2, default=str)
+
+        logger.info(f"Exported {stats.audio_chunks_count} audio chunks metadata")
+        if malformed_count > 0:
+            logger.warning(f"Skipped {malformed_count} malformed chunks")
+
+    async def _export_waveforms(self, stats: CleanupStats):
+        """Export waveform visualization data"""
+        logger.info("Exporting waveforms...")
+
+        waveforms = await WaveformData.find_all().to_list()
+        stats.waveforms_count = len(waveforms)
+
+        # Serialize waveforms
+        waveforms_data = []
+        for waveform in waveforms:
+            waveform_dict = waveform.model_dump(mode='json')
+            waveforms_data.append(waveform_dict)
+
+        output_path = self.backup_path / "waveforms.json"
+        with open(output_path, 'w') as f:
+            json.dump(waveforms_data, f, indent=2, default=str)
+
+        logger.info(f"Exported {stats.waveforms_count} waveforms")
+
+    async def _export_chat_sessions(self, stats: CleanupStats):
+        """Export chat sessions metadata"""
+        logger.info("Exporting chat sessions...")
+
+        chat_sessions_collection = self.mongo_db["chat_sessions"]
+        sessions_cursor = chat_sessions_collection.find({})
+
+        sessions_data = []
+        async for session in sessions_cursor:
+            session_dict = {
+                'session_id': session.get('session_id'),
+                'user_id': session.get('user_id'),
+                'title': session.get('title'),
+                'created_at': str(session.get('created_at', '')),
+                'updated_at': str(session.get('updated_at', '')),
+                'metadata': session.get('metadata', {})
+            }
+            sessions_data.append(session_dict)
+
+        stats.chat_sessions_count = len(sessions_data)
+
+        output_path = self.backup_path / "chat_sessions.json"
+        with open(output_path, 'w') as f:
+            json.dump(sessions_data, f, indent=2, default=str)
+
+        logger.info(f"Exported {stats.chat_sessions_count} chat sessions")
+
+    async def _export_chat_messages(self, stats: CleanupStats):
+        """Export chat messages"""
+        logger.info("Exporting chat messages...")
+
+        chat_messages_collection = self.mongo_db["chat_messages"]
+        messages_cursor = chat_messages_collection.find({})
+
+        messages_data = []
+        async for message in messages_cursor:
+            message_dict = {
+                'message_id': message.get('message_id'),
+                'session_id': message.get('session_id'),
+                'user_id': message.get('user_id'),
+                'role': message.get('role'),
+                'content': message.get('content'),
+                'timestamp': str(message.get('timestamp', '')),
+                'memories_used': message.get('memories_used', []),
+                'metadata': message.get('metadata', {})
+            }
+            messages_data.append(message_dict)
+
+        stats.chat_messages_count = len(messages_data)
+
+        output_path = self.backup_path / "chat_messages.json"
+        with open(output_path, 'w') as f:
+            json.dump(messages_data, f, indent=2, default=str)
+
+        logger.info(f"Exported {stats.chat_messages_count} chat messages")
+
+    async def _export_audio_wav(self, stats: CleanupStats):
+        """Export audio as WAV files (1-minute chunks)"""
+        logger.info("Exporting audio as WAV files (this may take a while)...")
+
+        # Get all unique conversation IDs
+        conversations = await Conversation.find_all().to_list()
+        audio_dir = self.backup_path / "audio"
+
+        for conv in conversations:
+            try:
+                await self._export_conversation_audio(conv.conversation_id, audio_dir)
+            except Exception as e:
+                logger.warning(f"Failed to export audio for {conv.conversation_id}: {e}")
+                continue
+
+        logger.info("Audio export completed")
+
+    async def _export_conversation_audio(self, conversation_id: str, audio_dir: Path):
+        """Export audio for a single conversation as 1-minute WAV chunks"""
+        # Get all chunks for this conversation
+        chunks = await AudioChunkDocument.find(
+            AudioChunkDocument.conversation_id == conversation_id
+        ).sort("+chunk_index").to_list()
+
+        if not chunks:
+            return
+
+        # Create conversation directory
+        conv_dir = audio_dir / conversation_id
+        conv_dir.mkdir(parents=True, exist_ok=True)
+
+        # Decode all Opus chunks to PCM
+        pcm_data = []
+        sample_rate = chunks[0].sample_rate
+        channels = chunks[0].channels
+
+        try:
+            import opuslib
+            decoder = opuslib.Decoder(sample_rate, channels)
+
+            for chunk in chunks:
+                # Decode Opus to PCM
+                # Note: frame_size depends on sample rate and duration
+                frame_size = int(sample_rate * chunk.duration / channels)
+                decoded = decoder.decode(bytes(chunk.audio_data), frame_size)
+                pcm_data.append(decoded)
+
+        except ImportError:
+            logger.warning("opuslib not available, skipping audio export")
+            return
+        except Exception as e:
+            logger.warning(f"Failed to decode audio for {conversation_id}: {e}")
+            return
+
+        # Concatenate all PCM data
+        all_pcm = b''.join(pcm_data)
+
+        # Convert bytes to int16 samples
+        samples = struct.unpack(f'<{len(all_pcm)//2}h', all_pcm)
+
+        # Split into 1-minute chunks
+        samples_per_minute = sample_rate * 60 * channels
+        chunk_num = 1
+
+        for start_idx in range(0, len(samples), samples_per_minute):
+            chunk_samples = samples[start_idx:start_idx + samples_per_minute]
+
+            # Write WAV file
+            wav_path = conv_dir / f"chunk_{chunk_num:03d}.wav"
+            self._write_wav(wav_path, sample_rate, channels, chunk_samples)
+            chunk_num += 1
+
+    def _write_wav(self, path: Path, sample_rate: int, channels: int, samples: Tuple[int, ...]):
+        """Write PCM samples to WAV file"""
+        import wave
+
+        with wave.open(str(path), 'wb') as wav_file:
+            wav_file.setnchannels(channels)
+            wav_file.setsampwidth(2)  # 16-bit
+            wav_file.setframerate(sample_rate)
+
+            # Convert samples back to bytes
+            pcm_bytes = struct.pack(f'<{len(samples)}h', *samples)
+            wav_file.writeframes(pcm_bytes)
+
+    async def _export_memories(self, qdrant_client: AsyncQdrantClient, stats: CleanupStats):
+        """Export Qdrant vectors to JSON"""
+        logger.info("Exporting memories from Qdrant...")
+
+        try:
+            collection_name = get_qdrant_collection_name()
+
+            # Check if collection exists
+            collections = await qdrant_client.get_collections()
+            collection_exists = any(
+                col.name == collection_name
+                for col in collections.collections
+            )
+
+            if not collection_exists:
+                logger.info("Memories collection does not exist, skipping export")
+                return
+
+            # Scroll through all vectors
+            memories_data = []
+            offset = None
+
+            while True:
+                result = await qdrant_client.scroll(
+                    collection_name=collection_name,
+                    limit=100,
+                    offset=offset,
+                    with_payload=True,
+                    with_vectors=True
+                )
+
+                points, next_offset = result
+
+                if not points:
+                    break
+
+                for point in points:
+                    memory_dict = {
+                        'id': str(point.id),
+                        'vector': point.vector,
+                        'payload': point.payload
+                    }
+                    memories_data.append(memory_dict)
+
+                if next_offset is None:
+                    break
+
+                offset = next_offset
+
+            stats.memories_count = len(memories_data)
+
+            output_path = self.backup_path / "memories.json"
+            with open(output_path, 'w') as f:
+                json.dump(memories_data, f, indent=2)
+
+            logger.info(f"Exported {stats.memories_count} memories")
+
+        except Exception as e:
+            logger.warning(f"Failed to export memories: {e}")
+
+    async def _generate_summary(self, stats: CleanupStats):
+        """Generate backup summary"""
+        summary = {
+            'timestamp': self.timestamp,
+            'backup_path': str(self.backup_path),
+            'total_conversations': stats.conversations_count,
+            'total_audio_chunks': stats.audio_chunks_count,
+            'total_waveforms': stats.waveforms_count,
+            'total_chat_sessions': stats.chat_sessions_count,
+            'total_chat_messages': stats.chat_messages_count,
+            'total_memories': stats.memories_count,
+            'audio_exported': self.export_audio,
+            'backup_size_bytes': 0  # Will be calculated after all files written
+        }
+
+        output_path = self.backup_path / "backup_summary.json"
+        with open(output_path, 'w') as f:
+            json.dump(summary, f, indent=2)
+
+
+class CleanupManager:
+    """Handle cleanup operations"""
+
+    def __init__(
+        self,
+        mongo_db: Any,
+        redis_conn: Any,
+        qdrant_client: Optional[AsyncQdrantClient],
+        include_wav: bool,
+        delete_users: bool
+    ):
+        self.mongo_db = mongo_db
+        self.redis_conn = redis_conn
+        self.qdrant_client = qdrant_client
+        self.include_wav = include_wav
+        self.delete_users = delete_users
+
+    async def perform_cleanup(self, stats: CleanupStats) -> bool:
+        """Perform all cleanup operations"""
+        try:
+            logger.info("Starting cleanup operations...")
+
+            # MongoDB cleanup
+            await self._cleanup_mongodb(stats)
+
+            # Qdrant cleanup
+            if self.qdrant_client:
+                await self._cleanup_qdrant(stats)
+
+            # Redis cleanup
+            self._cleanup_redis(stats)
+
+            # Legacy WAV cleanup
+            if self.include_wav:
+                self._cleanup_legacy_wav(stats)
+
+            logger.info("Cleanup completed successfully")
+            return True
+
+        except Exception as e:
+            logger.error(f"Cleanup failed: {e}", exc_info=True)
+            return False
+
+    async def _cleanup_mongodb(self, stats: CleanupStats):
+        """Clean MongoDB collections"""
+        logger.info("Cleaning MongoDB collections...")
+
+        # Count before deletion
+        stats.conversations_count = await Conversation.find_all().count()
+        # Use raw MongoDB count to handle malformed documents
+        stats.audio_chunks_count = await self.mongo_db["audio_chunks"].count_documents({})
+        stats.waveforms_count = await WaveformData.find_all().count()
+        stats.chat_sessions_count = await self.mongo_db["chat_sessions"].count_documents({})
+        stats.chat_messages_count = await self.mongo_db["chat_messages"].count_documents({})
+
+        if self.delete_users:
+            stats.users_count = await User.find_all().count()
+
+        # Delete conversations
+        result = await Conversation.find_all().delete()
+        logger.info(f"Deleted {stats.conversations_count} conversations")
+
+        # Delete audio chunks using raw MongoDB to handle malformed documents
+        result = await self.mongo_db["audio_chunks"].delete_many({})
+        logger.info(f"Deleted {stats.audio_chunks_count} audio chunks")
+
+        # Delete waveforms
+        result = await WaveformData.find_all().delete()
+        logger.info(f"Deleted {stats.waveforms_count} waveforms")
+
+        # Delete chat sessions
+        result = await self.mongo_db["chat_sessions"].delete_many({})
+        logger.info(f"Deleted {stats.chat_sessions_count} chat sessions")
+
+        # Delete chat messages
+        result = await self.mongo_db["chat_messages"].delete_many({})
+        logger.info(f"Deleted {stats.chat_messages_count} chat messages")
+
+        # Delete users if requested
+        if self.delete_users:
+            result = await User.find_all().delete()
+            logger.info(f"DANGEROUS: Deleted {stats.users_count} users")
+
+    async def _cleanup_qdrant(self, stats: CleanupStats):
+        """Clean Qdrant vector store"""
+        logger.info("Cleaning Qdrant memories...")
+
+        try:
+            collection_name = get_qdrant_collection_name()
+
+            # Check if collection exists
+            collections = await self.qdrant_client.get_collections()
+            collection_exists = any(
+                col.name == collection_name
+                for col in collections.collections
+            )
+
+            if not collection_exists:
+                logger.info("Memories collection does not exist, skipping cleanup")
+                return
+
+            # Get count before deletion
+            collection_info = await self.qdrant_client.get_collection(collection_name)
+            stats.memories_count = collection_info.points_count
+
+            # Delete and recreate collection
+            await self.qdrant_client.delete_collection(collection_name)
+            logger.info(f"Deleted memories collection ({stats.memories_count} vectors)")
+
+            # Recreate with default configuration
+            await self.qdrant_client.create_collection(
+                collection_name=collection_name,
+                vectors_config=VectorParams(size=1536, distance=Distance.COSINE)
+            )
+            logger.info("Recreated memories collection")
+
+        except Exception as e:
+            logger.warning(f"Failed to clean Qdrant: {e}")
+
+    def _cleanup_redis(self, stats: CleanupStats):
+        """Clean Redis job queues"""
+        logger.info("Cleaning Redis job queues...")
+
+        try:
+            queue_names = ["transcription", "memory", "audio", "default"]
+            total_jobs = 0
+
+            for queue_name in queue_names:
+                queue = Queue(queue_name, connection=self.redis_conn)
+
+                # Count jobs
+                job_count = (
+                    len(queue) +
+                    len(queue.started_job_registry) +
+                    len(queue.finished_job_registry) +
+                    len(queue.failed_job_registry) +
+                    len(queue.canceled_job_registry) +
+                    len(queue.deferred_job_registry) +
+                    len(queue.scheduled_job_registry)
+                )
+                total_jobs += job_count
+
+                # Clear queue and registries
+                queue.empty()
+
+                # Clear job registries (they don't have clear() method in all RQ versions)
+                # So we manually remove all job IDs
+                for job_id in queue.started_job_registry.get_job_ids():
+                    queue.started_job_registry.remove(job_id)
+                for job_id in queue.finished_job_registry.get_job_ids():
+                    queue.finished_job_registry.remove(job_id)
+                for job_id in queue.failed_job_registry.get_job_ids():
+                    queue.failed_job_registry.remove(job_id)
+                for job_id in queue.canceled_job_registry.get_job_ids():
+                    queue.canceled_job_registry.remove(job_id)
+                for job_id in queue.deferred_job_registry.get_job_ids():
+                    queue.deferred_job_registry.remove(job_id)
+                for job_id in queue.scheduled_job_registry.get_job_ids():
+                    queue.scheduled_job_registry.remove(job_id)
+
+                logger.info(f"Cleared {queue_name} queue ({job_count} jobs)")
+
+            stats.redis_jobs_count = total_jobs
+            logger.info(f"Cleared total of {total_jobs} Redis jobs")
+
+        except Exception as e:
+            logger.warning(f"Failed to clean Redis: {e}")
+
+    def _cleanup_legacy_wav(self, stats: CleanupStats):
+        """Clean legacy WAV files"""
+        logger.info("Cleaning legacy WAV files...")
+
+        try:
+            wav_dir = Path("/app/data/audio_chunks")
+
+            if not wav_dir.exists():
+                logger.info("Legacy WAV directory does not exist, skipping")
+                return
+
+            wav_files = list(wav_dir.glob("*.wav"))
+            stats.legacy_wav_count = len(wav_files)
+
+            for wav_file in wav_files:
+                wav_file.unlink()
+
+            logger.info(f"Deleted {stats.legacy_wav_count} legacy WAV files")
+
+        except Exception as e:
+            logger.warning(f"Failed to clean legacy WAV files: {e}")
+
+
+async def get_current_stats(
+    mongo_db: Any,
+    redis_conn: Any,
+    qdrant_client: Optional[AsyncQdrantClient]
+) -> CleanupStats:
+    """Get current statistics before cleanup"""
+    stats = CleanupStats()
+
+    # MongoDB counts
+    stats.conversations_count = await Conversation.find_all().count()
+    # Use raw MongoDB count to handle malformed documents
+    stats.audio_chunks_count = await mongo_db["audio_chunks"].count_documents({})
+    stats.waveforms_count = await WaveformData.find_all().count()
+    stats.chat_sessions_count = await mongo_db["chat_sessions"].count_documents({})
+    stats.chat_messages_count = await mongo_db["chat_messages"].count_documents({})
+    stats.users_count = await User.find_all().count()
+
+    # Qdrant count
+    if qdrant_client:
+        try:
+            collection_name = get_qdrant_collection_name()
+            collection_info = await qdrant_client.get_collection(collection_name)
+            stats.memories_count = collection_info.points_count
+        except Exception:
+            stats.memories_count = 0
+
+    # Redis count
+    try:
+        queue_names = ["transcription", "memory", "audio", "default"]
+        total_jobs = 0
+        for queue_name in queue_names:
+            queue = Queue(queue_name, connection=redis_conn)
+            total_jobs += (
+                len(queue) +
+                len(queue.started_job_registry) +
+                len(queue.finished_job_registry) +
+                len(queue.failed_job_registry) +
+                len(queue.canceled_job_registry) +
+                len(queue.deferred_job_registry) +
+                len(queue.scheduled_job_registry)
+            )
+        stats.redis_jobs_count = total_jobs
+    except Exception:
+        stats.redis_jobs_count = 0
+
+    # Legacy WAV count
+    wav_dir = Path("/app/data/audio_chunks")
+    if wav_dir.exists():
+        stats.legacy_wav_count = len(list(wav_dir.glob("*.wav")))
+
+    return stats
+
+
+def print_stats(stats: CleanupStats, title: str = "Current State"):
+    """Print statistics in a formatted way"""
+    print(f"\n{'='*60}")
+    print(f"{title:^60}")
+    print(f"{'='*60}")
+    print(f"Conversations:        {stats.conversations_count:>10}")
+    print(f"Audio Chunks:         {stats.audio_chunks_count:>10}")
+    print(f"Waveforms:            {stats.waveforms_count:>10}")
+    print(f"Chat Sessions:        {stats.chat_sessions_count:>10}")
+    print(f"Chat Messages:        {stats.chat_messages_count:>10}")
+    print(f"Memories (Qdrant):    {stats.memories_count:>10}")
+    print(f"Redis Jobs:           {stats.redis_jobs_count:>10}")
+    print(f"Legacy WAV Files:     {stats.legacy_wav_count:>10}")
+    print(f"Users:                {stats.users_count:>10}")
+    if stats.backup_path:
+        print(f"\nBackup Location: {stats.backup_path}")
+        if stats.backup_size_bytes > 0:
+            size_mb = stats.backup_size_bytes / (1024**2)
+            print(f"Backup Size: {size_mb:>10.2f} MB")
+    print(f"{'='*60}\n")
+
+
+def confirm_action(message: str) -> bool:
+    """Ask for user confirmation"""
+    response = input(f"{message} (yes/no): ").strip().lower()
+    return response == 'yes'
+
+
+async def main():
+    parser = argparse.ArgumentParser(
+        description='Clean Chronicle backend state with optional backup',
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog="""
+Examples:
+  # Dry-run to see what would be deleted
+  python cleanup_state.py --dry-run
+
+  # Safe cleanup with metadata backup
+  python cleanup_state.py --backup
+
+  # Full backup including audio export
+  python cleanup_state.py --backup --export-audio
+
+  # Automated cleanup without confirmation
+  python cleanup_state.py --backup --force
+        """
+    )
+
+    parser.add_argument(
+        '--backup',
+        action='store_true',
+        help='Create backup before cleaning (metadata only by default)'
+    )
+    parser.add_argument(
+        '--export-audio',
+        action='store_true',
+        help='Include audio WAV export in backup (can be large, requires --backup)'
+    )
+    parser.add_argument(
+        '--include-wav',
+        action='store_true',
+        help='Include legacy WAV file cleanup (backward compat)'
+    )
+    parser.add_argument(
+        '--dry-run',
+        action='store_true',
+        help='Show what would be cleaned without deleting'
+    )
+    parser.add_argument(
+        '--force',
+        action='store_true',
+        help='Skip confirmation prompt'
+    )
+    parser.add_argument(
+        '--backup-dir',
+        type=str,
+        default='/app/data/backups',
+        help='Backup directory location (default: /app/data/backups)'
+    )
+    parser.add_argument(
+        '--delete-users',
+        action='store_true',
+        help='DANGEROUS: Also delete user accounts'
+    )
+
+    args = parser.parse_args()
+
+    # Validate arguments
+    if args.export_audio and not args.backup:
+        logger.error("--export-audio requires --backup")
+        sys.exit(1)
+
+    # Initialize connections
+    logger.info("Connecting to services...")
+
+    # MongoDB
+    mongodb_uri = os.getenv("MONGODB_URI", "mongodb://mongo:27017")
+    mongodb_database = os.getenv("MONGODB_DATABASE", "chronicle")
+    mongo_client = AsyncIOMotorClient(mongodb_uri)
+    mongo_db = mongo_client[mongodb_database]
+
+    # Initialize Beanie
+    await init_beanie(
+        database=mongo_db,
+        document_models=[Conversation, AudioChunkDocument, WaveformData, User]
+    )
+
+    # Redis
+    redis_url = os.getenv("REDIS_URL", "redis://redis:6379/0")
+    redis_conn = redis.from_url(redis_url)
+
+    # Qdrant
+    qdrant_client = None
+    try:
+        qdrant_host = os.getenv("QDRANT_BASE_URL", "qdrant")
+        qdrant_port = int(os.getenv("QDRANT_PORT", "6333"))
+        qdrant_client = AsyncQdrantClient(host=qdrant_host, port=qdrant_port)
+    except Exception as e:
+        logger.warning(f"Qdrant not available: {e}")
+
+    # Get current statistics
+    logger.info("Gathering current statistics...")
+    stats = await get_current_stats(mongo_db, redis_conn, qdrant_client)
+
+    # Print current state
+    print_stats(stats, "Current Backend State")
+
+    # Dry-run mode
+    if args.dry_run:
+        print("\n[DRY-RUN MODE] No actual changes will be made\n")
+        if args.backup:
+            print("Would create backup at:", Path(args.backup_dir) / f"backup_{datetime.now().strftime('%Y%m%d_%H%M%S')}")
+            if args.export_audio:
+                print("Would include audio WAV export (1-minute chunks)")
+        print("\nWould delete:")
+        print(f"  - {stats.conversations_count} conversations")
+        print(f"  - {stats.audio_chunks_count} audio chunks")
+        print(f"  - {stats.waveforms_count} waveforms")
+        print(f"  - {stats.chat_sessions_count} chat sessions")
+        print(f"  - {stats.chat_messages_count} chat messages")
+        print(f"  - {stats.memories_count} memories")
+        print(f"  - {stats.redis_jobs_count} Redis jobs")
+        if args.include_wav:
+            print(f"  - {stats.legacy_wav_count} legacy WAV files")
+        if args.delete_users:
+            print(f"  - {stats.users_count} users (DANGEROUS)")
+        else:
+            print(f"  - Users will be preserved ({stats.users_count} users)")
+        print("\nRun without --dry-run to perform actual cleanup")
+        return
+
+    # Confirmation prompt
+    if not args.force:
+        print("\n⚠️ WARNING: This will permanently delete data!")
+        print(f"  - {stats.conversations_count} conversations")
+        print(f"  - {stats.audio_chunks_count} audio chunks")
+        print(f"  - {stats.waveforms_count} waveforms")
+        print(f"  - {stats.chat_sessions_count} chat sessions")
+        print(f"  - {stats.chat_messages_count} chat messages")
+        print(f"  - {stats.memories_count} memories")
+        print(f"  - {stats.redis_jobs_count} Redis jobs")
+        if args.include_wav:
+            print(f"  - {stats.legacy_wav_count} legacy WAV files")
+        if args.delete_users:
+            print(f"  - {stats.users_count} users (DANGEROUS)")
+        else:
+            print(f"  - Users will be preserved ({stats.users_count} users)")
+
+        if args.backup:
+            print(f"\n✓ Backup will be created at: {args.backup_dir}")
+            if args.export_audio:
+                print("✓ Audio will be exported as WAV files")
+        else:
+            print("\n✗ No backup will be created")
+
+        print()
+        if not confirm_action("Are you sure you want to proceed?"):
+            logger.info("Cleanup cancelled by user")
+            return
+
+    # Create backup if requested
+    if args.backup:
+        backup_manager = BackupManager(args.backup_dir, args.export_audio, mongo_db)
+        success = await backup_manager.create_backup(qdrant_client, stats)
+
+        if not success:
+            logger.error("Backup failed, aborting cleanup")
+            return
+
+        print_stats(stats, "Backup Created")
+
+    # Perform cleanup
+    cleanup_manager = CleanupManager(
+        mongo_db,
+        redis_conn,
+        qdrant_client,
+        args.include_wav,
+        args.delete_users
+    )
+
+    success = await cleanup_manager.perform_cleanup(stats)
+
+    if not success:
+        logger.error("Cleanup failed")
+        return
+
+    # Verify cleanup
+    logger.info("Verifying cleanup...")
+    final_stats = await get_current_stats(mongo_db, redis_conn, qdrant_client)
+    print_stats(final_stats, "Backend State After Cleanup")
+
+    logger.info("✓ Cleanup completed successfully!")
+
+    if args.backup:
+        logger.info(f"✓ Backup saved to: {stats.backup_path}")
+
+
+if __name__ == "__main__":
+    try:
+        asyncio.run(main())
+    except KeyboardInterrupt:
+        logger.info("\nCleanup interrupted by user")
+        sys.exit(1)
+    except Exception as e:
+        logger.error(f"Fatal error: {e}", exc_info=True)
+        sys.exit(1)
diff --git a/backends/advanced/tests/test_memory_entry.py b/backends/advanced/tests/test_memory_entry.py
new file mode 100644
index 00000000..fc8ae223
--- /dev/null
+++ b/backends/advanced/tests/test_memory_entry.py
@@ -0,0 +1,158 @@
+"""Unit tests for MemoryEntry dataclass.
+
+Tests timestamp initialization, auto-population, and serialization behavior.
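+
+These are pure unit tests (no database or network access); run them with,
+for example: pytest tests/test_memory_entry.py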
+""" + +import time +from advanced_omi_backend.services.memory.base import MemoryEntry + + +class TestMemoryEntryTimestamps: + """Test MemoryEntry timestamp handling.""" + + def test_memory_entry_auto_initializes_timestamps(self): + """Test that MemoryEntry auto-initializes created_at and updated_at when not provided.""" + before_creation = int(time.time()) + + entry = MemoryEntry( + id="test-123", + content="Test memory content" + ) + + after_creation = int(time.time()) + + # Both timestamps should be set + assert entry.created_at is not None, "created_at should be auto-initialized" + assert entry.updated_at is not None, "updated_at should be auto-initialized" + + # Timestamps should be strings + assert isinstance(entry.created_at, str), "created_at should be a string" + assert isinstance(entry.updated_at, str), "updated_at should be a string" + + # Timestamps should be numeric (Unix timestamps) + created_timestamp = int(entry.created_at) + updated_timestamp = int(entry.updated_at) + + # Timestamps should be within reasonable range (during test execution) + assert before_creation <= created_timestamp <= after_creation, "created_at should be within test execution time" + assert before_creation <= updated_timestamp <= after_creation, "updated_at should be within test execution time" + + # Both should be equal since they're created at the same time + assert entry.created_at == entry.updated_at, "created_at and updated_at should be equal for new entries" + + def test_memory_entry_with_created_at_only(self): + """Test that updated_at defaults to created_at when only created_at is provided.""" + custom_timestamp = "1234567890" + + entry = MemoryEntry( + id="test-123", + content="Test memory content", + created_at=custom_timestamp + ) + + assert entry.created_at == custom_timestamp, "created_at should match provided value" + assert entry.updated_at == custom_timestamp, "updated_at should default to created_at" + + def test_memory_entry_with_both_timestamps(self): + """Test that both timestamps are preserved when explicitly provided.""" + created_timestamp = "1234567890" + updated_timestamp = "1234567900" + + entry = MemoryEntry( + id="test-123", + content="Test memory content", + created_at=created_timestamp, + updated_at=updated_timestamp + ) + + assert entry.created_at == created_timestamp, "created_at should match provided value" + assert entry.updated_at == updated_timestamp, "updated_at should match provided value" + assert entry.created_at != entry.updated_at, "timestamps should be different when explicitly set" + + def test_memory_entry_to_dict_includes_timestamps(self): + """Test that to_dict() serialization includes both timestamp fields.""" + entry = MemoryEntry( + id="test-123", + content="Test memory content", + metadata={"user_id": "user-456"} + ) + + entry_dict = entry.to_dict() + + # Verify all expected keys are present + assert "id" in entry_dict, "Dict should contain 'id'" + assert "memory" in entry_dict, "Dict should contain 'memory' (for frontend)" + assert "content" in entry_dict, "Dict should contain 'content'" + assert "created_at" in entry_dict, "Dict should contain 'created_at'" + assert "updated_at" in entry_dict, "Dict should contain 'updated_at'" + assert "metadata" in entry_dict, "Dict should contain 'metadata'" + assert "user_id" in entry_dict, "Dict should contain 'user_id' (extracted from metadata)" + + # Verify timestamp values are present and correct + assert entry_dict["created_at"] == entry.created_at, "Serialized created_at should match entry" + assert 
entry_dict["updated_at"] == entry.updated_at, "Serialized updated_at should match entry" + + # Verify frontend compatibility + assert entry_dict["memory"] == entry.content, "memory field should match content for frontend" + assert entry_dict["content"] == entry.content, "content field should match content" + + def test_memory_entry_with_none_timestamps(self): + """Test that None timestamps are properly initialized.""" + entry = MemoryEntry( + id="test-123", + content="Test memory content", + created_at=None, + updated_at=None + ) + + # Both should be auto-initialized even when explicitly set to None + assert entry.created_at is not None, "created_at should be auto-initialized from None" + assert entry.updated_at is not None, "updated_at should be auto-initialized from None" + assert entry.created_at == entry.updated_at, "Both timestamps should be equal when auto-initialized" + + def test_memory_entry_with_all_fields(self): + """Test MemoryEntry with all fields populated.""" + entry = MemoryEntry( + id="test-123", + content="Test memory content", + metadata={"user_id": "user-456", "source": "test"}, + embedding=[0.1, 0.2, 0.3], + score=0.95, + created_at="1234567890", + updated_at="1234567900" + ) + + # Verify all fields are preserved + assert entry.id == "test-123" + assert entry.content == "Test memory content" + assert entry.metadata == {"user_id": "user-456", "source": "test"} + assert entry.embedding == [0.1, 0.2, 0.3] + assert entry.score == 0.95 + assert entry.created_at == "1234567890" + assert entry.updated_at == "1234567900" + + # Verify serialization + entry_dict = entry.to_dict() + assert entry_dict["score"] == 0.95 + assert entry_dict["user_id"] == "user-456" + + def test_memory_entry_timestamp_format(self): + """Test that timestamps are in the expected format (Unix timestamp strings).""" + entry = MemoryEntry( + id="test-123", + content="Test memory content" + ) + + # Timestamps should be strings representing Unix timestamps + assert entry.created_at.isdigit(), "created_at should be a numeric string" + assert entry.updated_at.isdigit(), "updated_at should be a numeric string" + + # Should be parseable as integers + created_int = int(entry.created_at) + updated_int = int(entry.updated_at) + + # Should be recent timestamps (after year 2020, before year 2100) + assert created_int > 1577836800, "Timestamp should be after 2020" + assert created_int < 4102444800, "Timestamp should be before 2100" + assert updated_int > 1577836800, "Timestamp should be after 2020" + assert updated_int < 4102444800, "Timestamp should be before 2100" diff --git a/backends/advanced/tests/test_memory_providers.py b/backends/advanced/tests/test_memory_providers.py new file mode 100644 index 00000000..af74bee7 --- /dev/null +++ b/backends/advanced/tests/test_memory_providers.py @@ -0,0 +1,239 @@ +"""Unit tests for memory provider timestamp handling. + +Tests that all providers properly handle created_at and updated_at fields +when converting their native formats to MemoryEntry objects. 
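+
+The provider instances are built around unittest.mock.Mock clients, so these
+tests should run without live Mycelia or OpenMemory services.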
+""" + +import time +from unittest.mock import Mock +from advanced_omi_backend.services.memory.providers.mycelia import MyceliaMemoryService +from advanced_omi_backend.services.memory.providers.openmemory_mcp import OpenMemoryMCPService +from advanced_omi_backend.services.memory.base import MemoryEntry + + +class TestMyceliaProviderTimestamps: + """Test Mycelia provider timestamp handling.""" + + def test_mycelia_object_to_memory_entry_with_both_timestamps(self): + """Test that Mycelia provider extracts both created_at and updated_at.""" + # Create a Mycelia service instance + service = MyceliaMemoryService(Mock()) + + # Mock Mycelia API object response + mycelia_obj = { + "_id": {"$oid": "507f1f77bcf86cd799439011"}, + "name": "Test Memory", + "details": "Test content", + "createdAt": {"$date": "2024-01-01T00:00:00.000Z"}, + "updatedAt": {"$date": "2024-01-02T00:00:00.000Z"}, + "isPerson": False, + "isEvent": False, + } + + # Convert to MemoryEntry + entry = service._mycelia_object_to_memory_entry(mycelia_obj, user_id="user-123") + + # Verify both timestamps are extracted + assert entry.created_at is not None, "created_at should be extracted" + assert entry.updated_at is not None, "updated_at should be extracted" + + # Verify timestamps match the source + assert entry.created_at == "2024-01-01T00:00:00.000Z", "created_at should match Mycelia createdAt" + assert entry.updated_at == "2024-01-02T00:00:00.000Z", "updated_at should match Mycelia updatedAt" + + # Verify timestamps are different (updated after created) + assert entry.created_at != entry.updated_at, "Timestamps should be different" + + def test_mycelia_object_to_memory_entry_with_missing_updated_at(self): + """Test that Mycelia provider handles missing updatedAt gracefully.""" + service = MyceliaMemoryService(Mock()) + + # Mock Mycelia object without updatedAt + mycelia_obj = { + "_id": {"$oid": "507f1f77bcf86cd799439011"}, + "name": "Test Memory", + "details": "Test content", + "createdAt": {"$date": "2024-01-01T00:00:00.000Z"}, + # updatedAt is missing + "isPerson": False, + "isEvent": False, + } + + # Convert to MemoryEntry + entry = service._mycelia_object_to_memory_entry(mycelia_obj, user_id="user-123") + + # created_at should be present + assert entry.created_at is not None, "created_at should be extracted" + + # updated_at should default to created_at (via MemoryEntry __post_init__) + # The _extract_bson_date returns None for missing fields, then __post_init__ sets it to created_at + assert entry.updated_at is not None, "updated_at should be set by __post_init__" + assert entry.updated_at == entry.created_at, "updated_at should default to created_at when missing" + + def test_mycelia_extract_bson_date(self): + """Test Mycelia BSON date extraction.""" + service = MyceliaMemoryService(Mock()) + + # Test BSON date format + bson_date = {"$date": "2024-01-01T00:00:00.000Z"} + extracted = service._extract_bson_date(bson_date) + assert extracted == "2024-01-01T00:00:00.000Z", "Should extract date from BSON format" + + # Test plain string date + plain_date = "2024-01-01T00:00:00.000Z" + extracted = service._extract_bson_date(plain_date) + assert extracted == "2024-01-01T00:00:00.000Z", "Should pass through plain date" + + # Test None + extracted = service._extract_bson_date(None) + assert extracted is None, "Should return None for None input" + + +class TestOpenMemoryMCPProviderTimestamps: + """Test OpenMemory MCP provider timestamp handling.""" + + def test_mcp_result_to_memory_entry_with_both_timestamps(self): + """Test that 
OpenMemory MCP provider extracts both timestamps.""" + # Create OpenMemory MCP service instance + service = OpenMemoryMCPService() + service.client_name = "test-client" + service.server_url = "http://localhost:8765" + + # Mock MCP API response + mcp_result = { + "id": "mem-123", + "content": "Test memory content", + "created_at": "1704067200", # 2024-01-01 00:00:00 UTC + "updated_at": "1704153600", # 2024-01-02 00:00:00 UTC + "metadata": {"source": "test"} + } + + # Convert to MemoryEntry + entry = service._mcp_result_to_memory_entry(mcp_result, user_id="user-123") + + # Verify both timestamps are extracted + assert entry is not None, "MemoryEntry should be created" + assert entry.created_at is not None, "created_at should be extracted" + assert entry.updated_at is not None, "updated_at should be extracted" + + # Verify timestamps match the source + assert entry.created_at == "1704067200", "created_at should match MCP response" + assert entry.updated_at == "1704153600", "updated_at should match MCP response" + + # Verify timestamps are different + assert entry.created_at != entry.updated_at, "Timestamps should be different" + + def test_mcp_result_to_memory_entry_with_missing_updated_at(self): + """Test that OpenMemory MCP provider defaults updated_at to created_at when missing.""" + service = OpenMemoryMCPService() + service.client_name = "test-client" + service.server_url = "http://localhost:8765" + + # Mock MCP response without updated_at + mcp_result = { + "id": "mem-123", + "content": "Test memory content", + "created_at": "1704067200", + # updated_at is missing + } + + # Convert to MemoryEntry + entry = service._mcp_result_to_memory_entry(mcp_result, user_id="user-123") + + # Verify updated_at defaults to created_at + assert entry is not None, "MemoryEntry should be created" + assert entry.created_at is not None, "created_at should be present" + assert entry.updated_at is not None, "updated_at should default to created_at" + assert entry.created_at == entry.updated_at, "updated_at should equal created_at when missing" + + def test_mcp_result_to_memory_entry_with_alternate_timestamp_fields(self): + """Test that OpenMemory MCP provider handles alternate timestamp field names.""" + service = OpenMemoryMCPService() + service.client_name = "test-client" + service.server_url = "http://localhost:8765" + + # Mock MCP response with alternate field names + mcp_result = { + "id": "mem-123", + "memory": "Test memory content", # Alternate content field + "timestamp": "1704067200", # Alternate created_at field + "modified_at": "1704153600", # Alternate updated_at field + } + + # Convert to MemoryEntry + entry = service._mcp_result_to_memory_entry(mcp_result, user_id="user-123") + + # Verify conversion handles alternate field names + assert entry is not None, "MemoryEntry should be created" + assert entry.content == "Test memory content", "Should extract from 'memory' field" + assert entry.created_at == "1704067200", "Should extract from 'timestamp' field" + assert entry.updated_at == "1704153600", "Should extract from 'modified_at' field" + + def test_mcp_result_with_no_timestamps(self): + """Test that OpenMemory MCP provider generates timestamps when none provided.""" + service = OpenMemoryMCPService() + service.client_name = "test-client" + service.server_url = "http://localhost:8765" + + before_conversion = int(time.time()) + + # Mock MCP response without any timestamp fields + mcp_result = { + "id": "mem-123", + "content": "Test memory content", + } + + # Convert to MemoryEntry + entry = 
service._mcp_result_to_memory_entry(mcp_result, user_id="user-123")
+
+        after_conversion = int(time.time())
+
+        # Verify timestamps are auto-generated
+        assert entry is not None, "MemoryEntry should be created"
+        assert entry.created_at is not None, "created_at should be auto-generated"
+        assert entry.updated_at is not None, "updated_at should be auto-generated"
+
+        # Verify timestamps are current (within test execution window)
+        created_int = int(entry.created_at)
+        updated_int = int(entry.updated_at)
+        assert before_conversion <= created_int <= after_conversion, "Timestamp should be current"
+        assert before_conversion <= updated_int <= after_conversion, "Timestamp should be current"
+
+
+class TestProviderTimestampConsistency:
+    """Test that all providers handle timestamps consistently."""
+
+    def test_all_providers_return_memory_entry_with_timestamps(self):
+        """Test that all providers return MemoryEntry objects with both timestamp fields."""
+        # This is a meta-test to ensure all providers conform to the MemoryEntry interface
+
+        # Mycelia
+        mycelia_service = MyceliaMemoryService(Mock())
+        mycelia_obj = {
+            "_id": {"$oid": "507f1f77bcf86cd799439011"},
+            "name": "Test",
+            "details": "Content",
+            "createdAt": {"$date": "2024-01-01T00:00:00.000Z"},
+            "updatedAt": {"$date": "2024-01-02T00:00:00.000Z"},
+        }
+        mycelia_entry = mycelia_service._mycelia_object_to_memory_entry(mycelia_obj, "user-123")
+
+        # OpenMemory MCP
+        mcp_service = OpenMemoryMCPService()
+        mcp_service.client_name = "test"
+        mcp_service.server_url = "http://localhost:8765"
+        mcp_result = {
+            "id": "mem-123",
+            "content": "Content",
+            "created_at": "1704067200",
+            "updated_at": "1704153600",
+        }
+        mcp_entry = mcp_service._mcp_result_to_memory_entry(mcp_result, "user-123")
+
+        # Verify all return MemoryEntry instances with both timestamp fields
+        for entry, provider_name in [(mycelia_entry, "Mycelia"), (mcp_entry, "OpenMemory MCP")]:
+            assert isinstance(entry, MemoryEntry), f"{provider_name} should return MemoryEntry"
+            assert hasattr(entry, "created_at"), f"{provider_name} entry should have created_at"
+            assert hasattr(entry, "updated_at"), f"{provider_name} entry should have updated_at"
+            assert entry.created_at is not None, f"{provider_name} created_at should not be None"
+            assert entry.updated_at is not None, f"{provider_name} updated_at should not be None"
diff --git a/backends/advanced/webui/src/components/audio/WaveformDisplay.tsx b/backends/advanced/webui/src/components/audio/WaveformDisplay.tsx
new file mode 100644
index 00000000..aaf0c442
--- /dev/null
+++ b/backends/advanced/webui/src/components/audio/WaveformDisplay.tsx
@@ -0,0 +1,173 @@
+import React, { useEffect, useRef, useState } from 'react';
+import { api } from '../../services/api';
+
+interface WaveformData {
+  samples: number[];
+  sample_rate: number;
+  duration_seconds: number;
+}
+
+interface WaveformDisplayProps {
+  conversationId: string;
+  duration: number;
+  currentTime?: number; // Current playback position in seconds
+  onSeek?: (time: number) => void; // Callback when user clicks to seek
+  height?: number; // Canvas height in pixels (default: 100)
+}
+
+export const WaveformDisplay: React.FC<WaveformDisplayProps> = ({
+  conversationId,
+  duration,
+  currentTime,
+  onSeek,
+  height = 100
+}) => {
+  const [waveformData, setWaveformData] = useState<WaveformData | null>(null);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState<string | null>(null);
+  const canvasRef = useRef<HTMLCanvasElement | null>(null);
+
+  // Fetch waveform data on component mount
+  useEffect(() => {
+    const fetchWaveform = async
() => { + setLoading(true); + setError(null); + + try { + const response = await api.get(`/api/conversations/${conversationId}/waveform`); + setWaveformData(response.data); + } catch (err: any) { + const errorMsg = err?.response?.data?.detail || err?.message || 'Failed to load waveform'; + console.error('Waveform fetch failed:', errorMsg); + setError(errorMsg); + } finally { + setLoading(false); + } + }; + + fetchWaveform(); + }, [conversationId]); + + // Draw waveform when data changes + useEffect(() => { + if (!waveformData || !canvasRef.current) return; + + const canvas = canvasRef.current; + const ctx = canvas.getContext('2d'); + if (!ctx) return; + + // Set canvas size + const rect = canvas.getBoundingClientRect(); + canvas.width = rect.width * window.devicePixelRatio; + canvas.height = height * window.devicePixelRatio; + ctx.scale(window.devicePixelRatio, window.devicePixelRatio); + + // Clear canvas + ctx.clearRect(0, 0, rect.width, height); + + // Draw waveform bars + drawWaveform(ctx, waveformData.samples, rect.width, height); + + // Draw playback position indicator + if (currentTime !== undefined && duration > 0) { + drawPlaybackIndicator(ctx, currentTime, duration, rect.width, height); + } + }, [waveformData, currentTime, duration, height]); + + const drawWaveform = ( + ctx: CanvasRenderingContext2D, + samples: number[], + width: number, + height: number + ) => { + const barWidth = width / samples.length; + const centerY = height / 2; + + ctx.fillStyle = '#3b82f6'; // Blue bars (Tailwind blue-500) + + samples.forEach((amplitude, i) => { + const x = i * barWidth; + const barHeight = Math.max(1, amplitude * centerY); // Ensure minimum 1px height + + // Draw bar centered vertically + ctx.fillRect(x, centerY - barHeight, barWidth - 1, barHeight * 2); + }); + }; + + const drawPlaybackIndicator = ( + ctx: CanvasRenderingContext2D, + currentTime: number, + duration: number, + width: number, + height: number + ) => { + const progress = currentTime / duration; + const x = progress * width; + + // Draw vertical line + ctx.strokeStyle = '#ef4444'; // Red line (Tailwind red-500) + ctx.lineWidth = 2; + ctx.beginPath(); + ctx.moveTo(x, 0); + ctx.lineTo(x, height); + ctx.stroke(); + }; + + const handleClick = (e: React.MouseEvent) => { + console.log('๐Ÿ–ฑ๏ธ Waveform clicked!'); + + if (!onSeek) { + console.warn('โš ๏ธ No onSeek callback provided'); + return; + } + + if (!canvasRef.current) { + console.warn('โš ๏ธ Canvas ref not available'); + return; + } + + const rect = canvasRef.current.getBoundingClientRect(); + const x = e.clientX - rect.left; + const seekProgress = x / rect.width; + const seekTime = seekProgress * duration; + + console.log(`๐ŸŽต Waveform seek: clicked at ${x}px (${(seekProgress * 100).toFixed(1)}%) โ†’ ${seekTime.toFixed(2)}s`); + + onSeek(seekTime); + }; + + // Render loading state + if (loading) { + return ( +
+      <div>Generating waveform...</div>
+    );
+  }
+
+  // Render error state
+  if (error) {
+    return (
+      <div>No waveform available</div>
+    );
+  }
+
+  // Render waveform
+  return (
+    <canvas
+      ref={canvasRef}
+      onClick={handleClick}
+      style={{ width: '100%', height: `${height}px` }}
+    />
+  );
+};
diff --git a/backends/advanced/webui/src/pages/Archive.tsx b/backends/advanced/webui/src/pages/Archive.tsx
new file mode 100644
index 00000000..4fa7851b
--- /dev/null
+++ b/backends/advanced/webui/src/pages/Archive.tsx
@@ -0,0 +1,389 @@
+import { useState, useEffect } from 'react'
+import { Archive as ArchiveIcon, RefreshCw, Calendar, User, RotateCcw, Trash2, ChevronDown, ChevronUp } from 'lucide-react'
+import { conversationsApi } from '../services/api'
+import { authApi } from '../services/api'
+
+interface Conversation {
+  conversation_id?: string
+  audio_uuid: string
+  title?: string
+  summary?: string
+  created_at?: string
+  client_id: string
+  segment_count?: number
+  memory_count?: number
+  deleted?: boolean
+  deletion_reason?: string
+  deleted_at?: string
+  transcript?: string
+  segments?: Array<{
+    text: string
+    speaker: string
+    start: number
+    end: number
+    confidence?: number
+  }>
+}
+
+export default function Archive() {
+  const [conversations, setConversations] = useState<Conversation[]>([])
+  const [loading, setLoading] = useState(true)
+  const [error, setError] = useState<string | null>(null)
+  const [expandedTranscripts, setExpandedTranscripts] = useState<Set<string>>(new Set())
+  const [restoringConversation, setRestoringConversation] = useState<Set<string>>(new Set())
+  const [deletingConversation, setDeletingConversation] = useState<Set<string>>(new Set())
+  const [isAdmin, setIsAdmin] = useState(false)
+
+  const loadArchivedConversations = async () => {
+    try {
+      setLoading(true)
+      // Include deleted conversations and filter for only deleted ones
+      const response = await conversationsApi.getAll(true)
+      const allConversations = response.data.conversations || []
+      // Filter to show only deleted conversations
+      const deletedConversations = allConversations.filter((conv: Conversation) => conv.deleted === true)
+      setConversations(deletedConversations)
+      setError(null)
+    } catch (err: any) {
+      setError(err.message || 'Failed to load archived conversations')
+    } finally {
+      setLoading(false)
+    }
+  }
+
+  const checkAdminStatus = async () => {
+    try {
+      const response = await authApi.getMe()
+      setIsAdmin(response.data.is_superuser || false)
+    } catch {
+      setIsAdmin(false)
+    }
+  }
+
+  useEffect(() => {
+    loadArchivedConversations()
+    checkAdminStatus()
+  }, [])
+
+  const formatDate = (timestamp: number | string) => {
+    if (typeof timestamp === 'string') {
+      // Detect an explicit timezone: trailing Z, +offset, or -offset after the T
+      const hasTimezone = timestamp.endsWith('Z') || timestamp.includes('+') || (timestamp.includes('T') && timestamp.split('T')[1].includes('-'))
+      const isoString = hasTimezone
+        ?
timestamp + : timestamp + 'Z' + return new Date(isoString).toLocaleString() + } + if (timestamp === 0) { + return 'Unknown date' + } + return new Date(timestamp * 1000).toLocaleString() + } + + const handleRestoreConversation = async (conversationId: string) => { + try { + setRestoringConversation(prev => new Set(prev).add(conversationId)) + + const response = await conversationsApi.restore(conversationId) + + if (response.status === 200) { + // Refresh archived conversations to show updated data + await loadArchivedConversations() + } else { + setError(`Failed to restore conversation: ${response.data?.error || 'Unknown error'}`) + } + } catch (err: any) { + setError(`Error restoring conversation: ${err.message || 'Unknown error'}`) + } finally { + setRestoringConversation(prev => { + const newSet = new Set(prev) + newSet.delete(conversationId) + return newSet + }) + } + } + + const handlePermanentDelete = async (conversationId: string) => { + try { + const confirmed = window.confirm( + 'Are you sure you want to PERMANENTLY delete this conversation? This action CANNOT be undone and will remove all data including audio.' + ) + if (!confirmed) return + + setDeletingConversation(prev => new Set(prev).add(conversationId)) + + const response = await conversationsApi.permanentDelete(conversationId) + + if (response.status === 200) { + // Refresh archived conversations to show updated data + await loadArchivedConversations() + } else { + setError(`Failed to permanently delete conversation: ${response.data?.error || 'Unknown error'}`) + } + } catch (err: any) { + setError(`Error permanently deleting conversation: ${err.message || 'Unknown error'}`) + } finally { + setDeletingConversation(prev => { + const newSet = new Set(prev) + newSet.delete(conversationId) + return newSet + }) + } + } + + const toggleTranscriptExpansion = async (conversationId: string) => { + if (expandedTranscripts.has(conversationId)) { + setExpandedTranscripts(prev => { + const newSet = new Set(prev) + newSet.delete(conversationId) + return newSet + }) + return + } + + const conversation = conversations.find(c => c.conversation_id === conversationId) + if (!conversation || !conversation.conversation_id) { + return + } + + if (conversation.segments && conversation.segments.length > 0) { + setExpandedTranscripts(prev => new Set(prev).add(conversationId)) + return + } + + try { + const response = await conversationsApi.getById(conversation.conversation_id) + if (response.status === 200 && response.data.conversation) { + setConversations(prev => prev.map(c => + c.conversation_id === conversationId + ? { ...c, ...response.data.conversation } + : c + )) + setExpandedTranscripts(prev => new Set(prev).add(conversationId)) + } + } catch (err: any) { + console.error('Failed to fetch conversation details:', err) + setError(`Failed to load transcript: ${err.message || 'Unknown error'}`) + } + } + + if (loading) { + return ( +
+
+ Loading archived conversations... +
+ ) + } + + if (error) { + return ( +
+
{error}
+ +
+ ) + } + + return ( +
+ {/* Header */} +
+
+ +

+ Archived Conversations +

+
+ +
+ + {/* Archive Info */} +
+

+ Archive: Deleted conversations are stored here. You can restore them to active view or permanently delete them {isAdmin && '(admin only)'}. +

+
+ + {/* Archived Conversations List */} +
+ {conversations.length === 0 ? ( +
+ +

No archived conversations

+
+ ) : ( + conversations.map((conversation) => ( +
+ {/* Deleted Conversation Banner */} +
+
+ +
+

Archived Conversation

+

+ Reason: {conversation.deletion_reason === 'user_deleted' + ? 'User deleted' + : conversation.deletion_reason === 'no_meaningful_speech' + ? 'No meaningful speech detected' + : conversation.deletion_reason === 'audio_file_not_ready' + ? 'Audio file not saved (possible Bluetooth disconnect)' + : conversation.deletion_reason || 'Unknown'} +

+ {conversation.deleted_at && ( +

+ Deleted at: {formatDate(conversation.deleted_at)} +

+ )} +
+
+
+ + {/* Conversation Header */} +
+
+

+ {conversation.title || "Conversation"} +

+ + {conversation.summary && ( +

+ {conversation.summary} +

+ )} + + {/* Metadata */} +
+
+ + {formatDate(conversation.created_at || '')} +
+
+ + {conversation.client_id} +
+
+
+ + {/* Action Buttons */} +
+ {conversation.conversation_id && ( + <> + + + {isAdmin && ( + + )} + + )} +
+
+ + {/* Transcript */} +
+ {(() => { + const segments = conversation.segments || [] + + return ( + <> + {/* Transcript Header with Expand/Collapse */} +
conversation.conversation_id && toggleTranscriptExpansion(conversation.conversation_id)} + > +

+ Transcript {(segments.length > 0 || conversation.segment_count) && ( + + ({segments.length || conversation.segment_count || 0} segments) + + )} +

+
+ {conversation.conversation_id && expandedTranscripts.has(conversation.conversation_id) ? ( + + ) : ( + + )} +
+
+ + {/* Transcript Content - Conditionally Rendered */} + {conversation.conversation_id && expandedTranscripts.has(conversation.conversation_id) && ( +
+ {segments.length > 0 ? ( +
+
+ {segments.map((segment, index) => { + const speaker = segment.speaker || 'Unknown' + return ( +
+
+ + {speaker}: + + + {segment.text} + +
+
+ ) + })} +
+
+ ) : ( +
+ No transcript available +
+ )} +
+ )} + + ) + })()} +
+
+ )) + )} +
+
+ ) +} diff --git a/backends/advanced/webui/src/pages/Conversations.tsx b/backends/advanced/webui/src/pages/Conversations.tsx index cd60dc08..bedde106 100644 --- a/backends/advanced/webui/src/pages/Conversations.tsx +++ b/backends/advanced/webui/src/pages/Conversations.tsx @@ -1,8 +1,9 @@ -import { useState, useEffect, useRef } from 'react' +import { useState, useEffect, useRef, useCallback } from 'react' import { MessageSquare, RefreshCw, Calendar, User, Play, Pause, MoreVertical, RotateCcw, Zap, ChevronDown, ChevronUp, Trash2 } from 'lucide-react' import { conversationsApi, BACKEND_URL } from '../services/api' import ConversationVersionHeader from '../components/ConversationVersionHeader' import { getStorageKey } from '../utils/storage' +import { WaveformDisplay } from '../components/audio/WaveformDisplay' interface Conversation { conversation_id?: string @@ -15,6 +16,8 @@ interface Conversation { segment_count?: number // From list endpoint memory_count?: number // From list endpoint audio_path?: string + audio_chunks_count?: number // Number of MongoDB audio chunks + audio_total_duration?: number // Total duration in seconds duration_seconds?: number has_memory?: boolean transcript?: string // From detail endpoint @@ -60,6 +63,7 @@ export default function Conversations() { const [expandedDetailedSummaries, setExpandedDetailedSummaries] = useState>(new Set()) // Audio playback state const [playingSegment, setPlayingSegment] = useState(null) // Format: "audioUuid-segmentIndex" + const [audioCurrentTime, setAudioCurrentTime] = useState<{ [conversationId: string]: number }>({}) const audioRefs = useRef<{ [key: string]: HTMLAudioElement }>({}) const segmentTimerRef = useRef(null) @@ -69,10 +73,68 @@ export default function Conversations() { const [reprocessingMemory, setReprocessingMemory] = useState>(new Set()) const [deletingConversation, setDeletingConversation] = useState>(new Set()) + // Stable seek handler for waveform click-to-seek + const handleSeek = useCallback((conversationId: string, time: number) => { + console.log(`๐ŸŽฏ handleSeek called: conversationId=${conversationId}, time=${time.toFixed(2)}s`); + + const audioElement = audioRefs.current[conversationId]; + + if (!audioElement) { + console.error(`โŒ Audio element not found for conversation ${conversationId}`); + console.log('Available audio refs:', Object.keys(audioRefs.current)); + return; + } + + console.log(`๐Ÿ“ Audio element found, readyState=${audioElement.readyState}, paused=${audioElement.paused}`); + + // Check if audio is ready for seeking (readyState >= 1 means HAVE_METADATA) + if (audioElement.readyState < 1) { + console.warn(`โš ๏ธ Audio not ready for seeking (readyState=${audioElement.readyState})`); + // Try again after metadata loads + audioElement.addEventListener('loadedmetadata', () => { + console.log('โœ… Metadata loaded, retrying seek'); + audioElement.currentTime = time; + }, { once: true }); + return; + } + + try { + // Force a small delay to ensure audio is ready + const wasPlaying = !audioElement.paused; + + // Pause before seeking (helps with seeking reliability) + if (wasPlaying) { + audioElement.pause(); + } + + // Set the seek position + audioElement.currentTime = time; + + // Verify the seek worked + setTimeout(() => { + console.log(`โœ… Seek complete: requested=${time.toFixed(2)}s, actual=${audioElement.currentTime.toFixed(2)}s`); + + if (Math.abs(audioElement.currentTime - time) > 1.0) { + console.error(`โš ๏ธ Seek failed! 
Requested ${time.toFixed(2)}s but got ${audioElement.currentTime.toFixed(2)}s`); + } + }, 100); + + // Resume playback if it was playing + if (wasPlaying) { + audioElement.play().catch(err => { + console.warn('Could not resume playback after seek:', err); + }); + } + } catch (err) { + console.error('โŒ Seek failed:', err); + } + }, []); // Empty deps - uses ref which is always stable + const loadConversations = async () => { try { setLoading(true) - const response = await conversationsApi.getAll() + // Exclude deleted conversations from main view + const response = await conversationsApi.getAll(false) // API now returns a flat list with client_id as a field const conversationsList = response.data.conversations || [] setConversations(conversationsList) @@ -445,38 +507,10 @@ export default function Conversations() { conversations.map((conversation) => (
- {/* Deleted Conversation Warning */} - {conversation.deleted && ( -
-
- -
-

Processing Failed

-

- Reason: {conversation.deletion_reason === 'no_meaningful_speech' - ? 'No meaningful speech detected' - : conversation.deletion_reason === 'audio_file_not_ready' - ? 'Audio file not saved (possible Bluetooth disconnect)' - : conversation.deletion_reason || 'Unknown'} -

- {conversation.deleted_at && ( -

- Deleted at: {new Date(conversation.deleted_at).toLocaleString()} -

- )} -
-
-
- )} - {/* Version Selector Header - Only show for conversations with conversation_id */} - {conversation.conversation_id && !conversation.deleted && ( + {conversation.conversation_id && (
- {/* Audio Player */} + {/* Audio Player with Waveform */}
- {conversation.audio_path && ( + {(conversation.audio_chunks_count && conversation.audio_chunks_count > 0) && ( <>
๐ŸŽต Audio
+ + {/* Waveform Visualization */} + {conversation.conversation_id && conversation.audio_total_duration && ( + handleSeek(conversation.conversation_id!, time)} + height={80} + /> + )} + + {/* Audio Player */} @@ -799,8 +863,6 @@ export default function Conversations() {

๐Ÿ”ง Debug Info:

Conversation ID: {conversation.conversation_id || 'N/A'}
-
Audio UUID: {conversation.audio_uuid}
-
Audio Path: {conversation.audio_path || 'N/A'}
Transcript Version Count: {conversation.transcript_version_count || 0}
Memory Version Count: {conversation.memory_version_count || 0}
Segment Count: {conversation.segment_count || 0}
diff --git a/backends/advanced/webui/src/pages/ConversationsRouter.tsx b/backends/advanced/webui/src/pages/ConversationsRouter.tsx index c7e6e95c..4cc98a4c 100644 --- a/backends/advanced/webui/src/pages/ConversationsRouter.tsx +++ b/backends/advanced/webui/src/pages/ConversationsRouter.tsx @@ -1,9 +1,10 @@ import { useState } from 'react' import Conversations from './Conversations' import ConversationsTimeline from './ConversationsTimeline' +import Archive from './Archive' export default function ConversationsRouter() { - const [activeTab, setActiveTab] = useState<'classic' | 'timeline'>('classic') + const [activeTab, setActiveTab] = useState<'classic' | 'timeline' | 'archive'>('classic') return (
@@ -34,14 +35,28 @@ export default function ConversationsRouter() { > Timeline +
{/* Content */} {activeTab === 'classic' ? ( - ) : ( + ) : activeTab === 'timeline' ? ( + ) : ( + )}
) diff --git a/backends/advanced/webui/src/pages/ConversationsTimeline.tsx b/backends/advanced/webui/src/pages/ConversationsTimeline.tsx index 40626f5c..2ba55c77 100644 --- a/backends/advanced/webui/src/pages/ConversationsTimeline.tsx +++ b/backends/advanced/webui/src/pages/ConversationsTimeline.tsx @@ -87,11 +87,6 @@ function ConversationCard({ conversation, formatDuration }: ConversationCardProp {formatDuration(conversation.duration_seconds)} )} - {conversation.deleted && ( - - Failed: {conversation.deletion_reason || 'Unknown'} - - )}
@@ -149,12 +144,6 @@ function ConversationCard({ conversation, formatDuration }: ConversationCardProp {conversation.conversation_id.slice(0, 8)}... )} - {conversation.audio_uuid && ( -
- Audio UUID:{' '} - {conversation.audio_uuid.slice(0, 8)}... -
- )} {conversation.active_transcript_version && (
Transcript Version:{' '} @@ -168,14 +157,6 @@ function ConversationCard({ conversation, formatDuration }: ConversationCardProp
)} - - {/* Audio Path */} - {conversation.audio_path && ( -
- Audio:{' '} - {conversation.audio_path} -
- )} )} @@ -190,7 +171,8 @@ export default function ConversationsTimeline() { const loadConversations = async () => { try { setLoading(true) - const response = await conversationsApi.getAll() + // Exclude deleted conversations from timeline view + const response = await conversationsApi.getAll(false) const conversationsList = response.data.conversations || [] setConversations(conversationsList) setError(null) diff --git a/backends/advanced/webui/src/pages/Memories.tsx b/backends/advanced/webui/src/pages/Memories.tsx index 732d1683..9c488e85 100644 --- a/backends/advanced/webui/src/pages/Memories.tsx +++ b/backends/advanced/webui/src/pages/Memories.tsx @@ -174,7 +174,12 @@ export default function Memories() { (memory.category?.toLowerCase() || '').includes(searchQuery.toLowerCase()) ) - const formatDate = (dateInput: string | number) => { + const formatDate = (dateInput: string | number | undefined | null) => { + // Handle missing/undefined dates + if (dateInput === undefined || dateInput === null || dateInput === '') { + return 'N/A' + } + // Handle both timestamp numbers and date strings let date: Date @@ -198,7 +203,7 @@ export default function Memories() { // Check if date is valid if (isNaN(date.getTime())) { console.warn('Invalid date:', dateInput) - return 'Invalid Date' + return 'N/A' } return date.toLocaleString() diff --git a/backends/advanced/webui/src/services/api.ts b/backends/advanced/webui/src/services/api.ts index e5368dcd..9861aaf0 100644 --- a/backends/advanced/webui/src/services/api.ts +++ b/backends/advanced/webui/src/services/api.ts @@ -107,9 +107,15 @@ export const authApi = { } export const conversationsApi = { - getAll: () => api.get('/api/conversations'), + getAll: (includeDeleted?: boolean) => api.get('/api/conversations', { + params: includeDeleted !== undefined ? { include_deleted: includeDeleted } : {} + }), getById: (id: string) => api.get(`/api/conversations/${id}`), delete: (id: string) => api.delete(`/api/conversations/${id}`), + restore: (id: string) => api.post(`/api/conversations/${id}/restore`), + permanentDelete: (id: string) => api.delete(`/api/conversations/${id}`, { + params: { permanent: true } + }), // Reprocessing endpoints reprocessTranscript: (conversationId: string) => api.post(`/api/conversations/${conversationId}/reprocess-transcript`), diff --git a/config/defaults.yml b/config/defaults.yml new file mode 100644 index 00000000..36adbdf4 --- /dev/null +++ b/config/defaults.yml @@ -0,0 +1,248 @@ +# Chronicle Default Configuration +# This file provides sensible defaults for all configuration options. +# User overrides in config.yml take precedence over these defaults. 
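+#
+# Override example (illustrative): a config.yml containing only
+#
+#   defaults:
+#     llm: local-llm
+#
+# swaps the default LLM while every other value in this file still applies,
+# because dictionaries are deep-merged key by key and user values win.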
+ +defaults: + llm: openai-llm + embedding: openai-embed + stt: stt-deepgram + tts: tts-http + vector_store: vs-qdrant + +models: + # =========================== + # LLM Models + # =========================== + - name: openai-llm + description: OpenAI GPT-4o-mini + model_type: llm + model_provider: openai + api_family: openai + model_name: gpt-4o-mini + model_url: https://api.openai.com/v1 + api_key: ${OPENAI_API_KEY:-} + model_params: + temperature: 0.2 + max_tokens: 2000 + model_output: json + + - name: local-llm + description: Local Ollama LLM + model_type: llm + model_provider: ollama + api_family: openai + model_name: llama3.1:latest + model_url: http://localhost:11434/v1 + api_key: ${OPENAI_API_KEY:-ollama} + model_params: + temperature: 0.2 + max_tokens: 2000 + model_output: json + + - name: groq-llm + description: Groq LLM via OpenAI-compatible API + model_type: llm + model_provider: groq + api_family: openai + model_name: llama-3.1-70b-versatile + model_url: https://api.groq.com/openai/v1 + api_key: ${GROQ_API_KEY:-} + model_params: + temperature: 0.2 + max_tokens: 2000 + model_output: json + + # =========================== + # Embedding Models + # =========================== + - name: openai-embed + description: OpenAI text-embedding-3-small + model_type: embedding + model_provider: openai + api_family: openai + model_name: text-embedding-3-small + model_url: https://api.openai.com/v1 + api_key: ${OPENAI_API_KEY:-} + embedding_dimensions: 1536 + model_output: vector + + - name: local-embed + description: Local embeddings via Ollama nomic-embed-text + model_type: embedding + model_provider: ollama + api_family: openai + model_name: nomic-embed-text:latest + model_url: http://localhost:11434/v1 + api_key: ${OPENAI_API_KEY:-ollama} + embedding_dimensions: 768 + model_output: vector + + # =========================== + # Speech-to-Text Models + # =========================== + - name: stt-deepgram + description: Deepgram Nova 3 (batch) + model_type: stt + model_provider: deepgram + api_family: http + model_url: https://api.deepgram.com/v1 + api_key: ${DEEPGRAM_API_KEY:-} + operations: + stt_transcribe: + method: POST + path: /listen + headers: + Authorization: Token ${DEEPGRAM_API_KEY:-} + Content-Type: audio/raw + query: + model: nova-3 + language: multi + smart_format: 'true' + punctuate: 'true' + diarize: 'true' + encoding: linear16 + sample_rate: 16000 + channels: '1' + response: + type: json + extract: + text: results.channels[0].alternatives[0].transcript + words: results.channels[0].alternatives[0].words + segments: results.channels[0].alternatives[0].paragraphs.paragraphs + + - name: stt-parakeet-batch + description: Parakeet NeMo ASR (batch) + model_type: stt + model_provider: parakeet + api_family: http + model_url: http://${PARAKEET_ASR_URL:-172.17.0.1:8767} + api_key: '' + operations: + stt_transcribe: + method: POST + path: /transcribe + content_type: multipart/form-data + response: + type: json + extract: + text: text + words: words + segments: segments + + # =========================== + # Text-to-Speech Models + # =========================== + - name: tts-http + description: Generic JSON TTS endpoint + model_type: tts + model_provider: custom + api_family: http + model_url: http://localhost:9000 + operations: + tts_synthesize: + method: POST + path: /synthesize + headers: + Content-Type: application/json + response: + type: json + + # =========================== + # Streaming STT Models + # =========================== + - name: stt-parakeet-stream + description: 
Parakeet streaming transcription over WebSocket + model_type: stt_stream + model_provider: parakeet + api_family: websocket + model_url: ws://localhost:9001/stream + operations: + start: + message: + type: transcribe + config: + vad_enabled: true + vad_silence_ms: 1000 + time_interval_seconds: 30 + return_interim_results: true + min_audio_seconds: 0.5 + chunk_header: + message: + type: audio_chunk + rate: 16000 + width: 2 + channels: 1 + end: + message: + type: stop + expect: + interim_type: interim_result + final_type: final_result + extract: + text: text + words: words + segments: segments + + # =========================== + # Vector Store + # =========================== + - name: vs-qdrant + description: Qdrant vector database + model_type: vector_store + model_provider: qdrant + api_family: qdrant + model_url: http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333} + model_params: + host: ${QDRANT_BASE_URL:-qdrant} + port: ${QDRANT_PORT:-6333} + collection_name: omi_memories + +# =========================== +# Memory Configuration +# =========================== +memory: + provider: chronicle + timeout_seconds: 1200 + extraction: + enabled: true + prompt: | + Extract important information from this conversation and return a JSON object with an array named "facts". + Include personal preferences, plans, names, dates, locations, numbers, and key details. + Keep items concise and useful. + + # OpenMemory MCP provider settings (used when provider: openmemory_mcp) + openmemory_mcp: + server_url: http://localhost:8765 + client_name: chronicle + user_id: default + timeout: 30 + + # Mycelia provider settings (used when provider: mycelia) + mycelia: + api_url: http://localhost:5173 + timeout: 30 + + # Obsidian Neo4j provider settings (legacy) + obsidian: + enabled: false + neo4j_host: neo4j-mem0 + timeout: 30 + +# =========================== +# Speaker Recognition +# =========================== +speaker_recognition: + # Enable/disable speaker recognition (overrides DISABLE_SPEAKER_RECOGNITION env var) + enabled: true + # Service URL (defaults to SPEAKER_SERVICE_URL env var if not specified) + service_url: null + # Request timeout in seconds + timeout: 60 + +# =========================== +# Chat Configuration +# =========================== +chat: + system_prompt: | + You are a helpful AI assistant with access to the user's conversation history and memories. + Provide clear, concise, and accurate responses based on the context available to you. 
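The settings above lean on shell-style `${VAR:-default}` placeholders. A minimal sketch of that expansion semantics, assuming a regex-based resolver (the `resolve_env` helper and its pattern are illustrative, not the backend's actual code):

```python
import os
import re

# Matches ${VAR} or ${VAR:-default}; named groups keep the substitution readable.
_ENV_PATTERN = re.compile(r"\$\{(?P<name>[A-Za-z_][A-Za-z0-9_]*)(?::-(?P<default>[^}]*))?\}")


def resolve_env(value: str) -> str:
    """Expand ${VAR:-default} placeholders using the process environment."""
    def _sub(match: re.Match) -> str:
        default = match.group("default") or ""
        return os.environ.get(match.group("name"), default)

    return _ENV_PATTERN.sub(_sub, value)


# With QDRANT_BASE_URL and QDRANT_PORT unset, the fallbacks apply:
print(resolve_env("http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333}"))
# -> http://qdrant:6333
```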
diff --git a/tests/endpoints/memory_tests.robot b/tests/endpoints/memory_tests.robot index c8d2af49..b12a4ff6 100644 --- a/tests/endpoints/memory_tests.robot +++ b/tests/endpoints/memory_tests.robot @@ -36,12 +36,25 @@ Get User Memories Test Dictionary Should Contain Key ${memory} id Dictionary Should Contain Key ${memory} memory Dictionary Should Contain Key ${memory} created_at + Dictionary Should Contain Key ${memory} updated_at Dictionary Should Contain Key ${metadata} source Dictionary Should Contain Key ${metadata} client_id Dictionary Should Contain Key ${metadata} source_id Dictionary Should Contain Key ${metadata} user_id Dictionary Should Contain Key ${metadata} user_email + # Verify timestamps are valid (not "Invalid Date", not empty) + Should Not Be Equal ${memory}[created_at] ${EMPTY} created_at should not be empty + Should Not Be Equal ${memory}[updated_at] ${EMPTY} updated_at should not be empty + Should Not Be Equal ${memory}[created_at] Invalid Date created_at should not be "Invalid Date" + Should Not Be Equal ${memory}[updated_at] Invalid Date updated_at should not be "Invalid Date" + + # Verify timestamps are numeric strings (Unix timestamps) + ${created_timestamp}= Convert To Integer ${memory}[created_at] + ${updated_timestamp}= Convert To Integer ${memory}[updated_at] + Should Be True ${created_timestamp} > 0 created_at should be a positive timestamp + Should Be True ${updated_timestamp} > 0 updated_at should be a positive timestamp + # Check if memory contains "trumpet flower" ${memory_text}= Convert To String ${memory}[memory] ${contains}= Run Keyword And Return Status Should Contain ${memory_text} trumpet flower ignore_case=True diff --git a/tests/integration/sdk_tests.robot b/tests/integration/sdk_tests.robot new file mode 100644 index 00000000..6101ff6f --- /dev/null +++ b/tests/integration/sdk_tests.robot @@ -0,0 +1,102 @@ +*** Settings *** +Documentation Minimal tests for Chronicle Python SDK +... +... Tests basic SDK functionality including authentication, +... file upload, and conversation retrieval. +... +... Placeholders included for unimplemented features. + +Library Process +Library OperatingSystem +Library Collections +Resource ../setup/setup_keywords.robot +Resource ../setup/teardown_keywords.robot +Resource ../resources/session_keywords.robot +Variables ../setup/test_env.py + +Suite Setup Suite Setup +Suite Teardown Suite Teardown + +*** Variables *** +${BACKEND_URL} http://localhost:8001 +${SDK_PATH} ${CURDIR}/../../sdk/python +${TEST_AUDIO_DIR} ${CURDIR}/../../extras/test-audios + +*** Test Cases *** +SDK Can Authenticate With Admin Credentials + [Documentation] Test SDK login functionality + [Tags] permissions + + ${result}= Run Process uv run python + ... ${CURDIR}/../scripts/sdk_test_auth.py + ... ${BACKEND_URL} ${ADMIN_EMAIL} ${ADMIN_PASSWORD} + Should Be Equal As Integers ${result.rc} 0 SDK authentication should succeed + Should Contain ${result.stdout} SUCCESS Should print success message + +SDK Can Upload Audio File + [Documentation] Test SDK audio upload functionality + [Tags] audio-upload + + ${test_audio}= Set Variable ${TEST_AUDIO_DIR}/audio_short.wav + File Should Exist ${test_audio} Test audio file should exist + + ${result}= Run Process uv run python + ... ${CURDIR}/../scripts/sdk_test_upload.py + ... 
${BACKEND_URL} ${ADMIN_EMAIL} ${ADMIN_PASSWORD} ${test_audio} + Should Be Equal As Integers ${result.rc} 0 SDK upload should succeed + Should Contain ${result.stdout} STATUS:processing File should be in processing status + +SDK Can Retrieve Conversations + [Documentation] Test SDK conversation retrieval + [Tags] conversation + + ${result}= Run Process uv run python + ... ${CURDIR}/../scripts/sdk_test_conversations.py + ... ${BACKEND_URL} ${ADMIN_EMAIL} ${ADMIN_PASSWORD} + Should Be Equal As Integers ${result.rc} 0 SDK should retrieve conversations + Should Contain ${result.stdout} COUNT: Should print conversation count + +SDK Upload Respects Backend File Size Limit + [Documentation] Verify SDK properly reports backend errors for oversized files + [Tags] audio-upload + + # Note: This tests that SDK handles backend rejection gracefully + # The 30-minute limit is enforced by the backend, not the SDK + # Full test would require a 30+ minute audio file + + ${result}= Run Process uv run python + ... ${CURDIR}/../scripts/sdk_test_auth.py + ... ${BACKEND_URL} ${ADMIN_EMAIL} ${ADMIN_PASSWORD} + Should Be Equal As Integers ${result.rc} 0 SDK should handle backend errors gracefully + +# ============================================================================== +# PLACEHOLDERS FOR UNIMPLEMENTED FEATURES +# ============================================================================== + +SDK Can Stream Large Audio Files Via WebSocket + [Documentation] PLACEHOLDER: WebSocket streaming support not yet implemented + [Tags] audio-streaming + Skip WebSocket streaming not implemented in SDK yet + +SDK Can Resume Interrupted Uploads + [Documentation] PLACEHOLDER: Resumable uploads not supported by backend + [Tags] audio-upload + Skip Resumable uploads not supported + +SDK Can Handle Batch Upload With Progress + [Documentation] PLACEHOLDER: Batch upload is implemented but needs Robot test + [Tags] audio-batch + Skip Test implementation pending + +SDK Can Search Memories + [Documentation] PLACEHOLDER: Memory search API not exposed in SDK yet + [Tags] memory + Skip Memory search not implemented in SDK + +SDK Can Manage Action Items + [Documentation] PLACEHOLDER: Action items API not exposed in SDK yet + [Tags] infra + Skip Action items not implemented in SDK + +*** Keywords *** +# Using Suite Setup/Teardown from setup_keywords.robot diff --git a/tests/integration/websocket_transcription_e2e_test.robot b/tests/integration/websocket_transcription_e2e_test.robot new file mode 100644 index 00000000..23b2d8ea --- /dev/null +++ b/tests/integration/websocket_transcription_e2e_test.robot @@ -0,0 +1,246 @@ +*** Settings *** +Documentation End-to-End WebSocket Streaming Transcription Tests +... +... This test suite validates the complete transcription data flow +... that was previously untested, which led to the end_marker bug. +... +... Critical paths tested: +... 1. Audio โ†’ Deepgram WebSocket โ†’ Interim results (pub/sub) +... 2. Stream close โ†’ end_marker sent โ†’ CloseStream message +... 3. Deepgram โ†’ Final results โ†’ Redis stream transcription:results:{session_id} +... 4. Speech detection job โ†’ Reads Redis stream โ†’ Creates conversation +... +... These tests would have caught the missing end_marker bug immediately. 
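+# Sketch of the producer/consumer contract these tests exercise (redis-py;
+# every stream field name except end_marker is an assumption):
+#
+#     r = redis.Redis()
+#     # Producer, when finalizing a session:
+#     r.xadd(f"audio:stream:{client_id}", {"end_marker": "1"})
+#     # Consumer: on reading end_marker, send CloseStream to Deepgram, then
+#     # write final transcripts to transcription:results:{client_id}.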
+
+Resource    ../resources/websocket_keywords.robot
+Resource    ../resources/conversation_keywords.robot
+Resource    ../resources/redis_keywords.robot
+Resource    ../resources/queue_keywords.robot
+Resource    ../setup/setup_keywords.robot
+Resource    ../setup/teardown_keywords.robot
+
+Suite Setup    Suite Setup
+Suite Teardown    Suite Teardown
+Test Setup    Test Cleanup
+
+Test Tags    audio-streaming    e2e    requires-api-keys
+
+
+*** Test Cases ***
+
+WebSocket Stream Produces Final Transcripts In Redis
+    [Documentation]    Verify that closing a stream triggers end_marker,
+    ...    CloseStream message to Deepgram, and final results
+    ...    are written to Redis stream transcription:results:{session_id}
+    ...
+    ...    This test directly validates the bug fix:
+    ...    - Producer sends end_marker when finalizing session
+    ...    - Streaming consumer detects end_marker
+    ...    - Consumer sends CloseStream to Deepgram
+    ...    - Deepgram returns final results (is_final=True)
+    ...    - Final results written to Redis stream
+    [Tags]    audio-streaming    infra
+
+    ${device_name}=    Set Variable    final-transcript-test
+    ${client_id}=    Get Client ID From Device Name    ${device_name}
+
+    # Open stream and send audio
+    ${stream_id}=    Open Audio Stream    device_name=${device_name}
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=100
+
+    # Critical: Close stream triggers the entire finalization flow
+    Log    Closing stream - should trigger: end_marker → CloseStream → final results
+    Close Audio Stream    ${stream_id}
+
+    # Allow time for streaming consumer to process end_marker and get final results
+    Sleep    5s
+
+    # Verify Redis stream transcription:results:{client_id} has entries
+    ${stream_name}=    Set Variable    transcription:results:${client_id}
+    ${stream_length}=    Redis Command    XLEN    ${stream_name}
+
+    Should Be True    ${stream_length} > 0
+    ...    Redis stream ${stream_name} is empty - no final transcripts received! This means end_marker was not sent or CloseStream failed.
+
+    Log    ✅ Redis stream has ${stream_length} final transcript(s)
+
+
+Speech Detection Receives Transcription From Stream
+    [Documentation]    Verify speech detection job successfully reads transcripts
+    ...    from Redis stream and does NOT fail with "no_speech_detected"
+    ...
+    ...    This is the exact failure scenario from the bug:
+    ...    - Speech detection reads from transcription:results:{session_id}
+    ...    - If stream is empty, returns "No transcription received"
+    ...    - If stream has data, creates conversation
+    [Tags]    audio-streaming    queue
+
+    ${device_name}=    Set Variable    speech-receives-test
+    ${client_id}=    Get Client ID From Device Name    ${device_name}
+
+    # Stream audio and close
+    ${stream_id}=    Open Audio Stream    device_name=${device_name}
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
+    Close Audio Stream    ${stream_id}
+
+    # Wait for speech detection job to complete
+    # It should find transcripts in Redis stream and create conversation
+    ${speech_jobs}=    Wait Until Keyword Succeeds    60s    3s
+    ...
Get Jobs By Type And Client speech_detection ${client_id} + + Should Not Be Empty ${speech_jobs} No speech detection job found + + # Get the first (most recent) speech detection job + ${speech_job}= Set Variable ${speech_jobs}[0] + ${job_id}= Set Variable ${speech_job}[job_id] + + # Wait for job to complete + Wait For Job Status ${job_id} completed timeout=60s interval=2s + + # Get job result + ${result}= Get Job Result ${job_id} + + # Critical assertion: Job should NOT have "no_speech_detected" + # This would indicate the Redis stream was empty + Should Not Contain ${result} no_speech_detected + ... Speech detection failed with no_speech_detected - Redis stream was empty! + + # Job should have created a conversation + Should Contain ${result} conversation_job_id + ... Speech detection did not create conversation_job_id + + Log โœ… Speech detection successfully received transcription from Redis stream + + +Conversation Created With Valid Transcript + [Documentation] End-to-end verification: Audio โ†’ Transcription โ†’ Conversation + ... Ensures the complete pipeline works with WebSocket streaming + [Tags] audio-streaming conversation + + ${device_name}= Set Variable e2e-conv-test + ${client_id}= Get Client ID From Device Name ${device_name} + + # Stream audio (enough to trigger speech detection) + ${stream_id}= Open Audio Stream device_name=${device_name} + Send Audio Chunks To Stream ${stream_id} ${TEST_AUDIO_FILE} num_chunks=200 + Close Audio Stream ${stream_id} + + # Wait for conversation to be created + ${conv_jobs}= Wait Until Keyword Succeeds 60s 3s + ... Job Type Exists For Client open_conversation ${client_id} + + ${conv_job}= Set Variable ${conv_jobs}[0] + ${conv_meta}= Set Variable ${conv_job}[meta] + ${conversation_id}= Evaluate $conv_meta.get('conversation_id', '') + + Should Not Be Empty ${conversation_id} + ... Conversation ID not found in open_conversation job metadata + + # Wait for conversation to complete processing (inactivity timeout) + Wait For Job Status ${conv_job}[job_id] completed timeout=60s interval=2s + + # Retrieve the conversation + ${conversation}= Get Conversation By ID ${conversation_id} + + # Verify conversation has transcript + Dictionary Should Contain Key ${conversation} transcript + ${transcript}= Set Variable ${conversation}[transcript] + Should Not Be Empty ${transcript} Conversation has empty transcript + + # Verify transcript has content (at least 50 characters for meaningful speech) + ${transcript_text}= Run Keyword If isinstance($transcript, list) + ... Set Variable ${transcript}[0][text] + ... ELSE Set Variable ${transcript} + + ${transcript_length}= Get Length ${transcript_text} + Should Be True ${transcript_length} >= 50 + ... Transcript too short: ${transcript_length} characters (expected 50+) + + Log โœ… Conversation created with valid transcript: ${transcript_length} characters + + +Stream Close Sends End Marker To Redis Stream + [Documentation] Verify the producer actually sends end_marker when finalizing + ... 
This is a low-level infrastructure test to catch the exact bug
+    [Tags]    audio-streaming    infra
+
+    ${device_name}=    Set Variable    end-marker-test
+    ${client_id}=    Get Client ID From Device Name    ${device_name}
+
+    # Open stream and send some audio
+    ${stream_id}=    Open Audio Stream    device_name=${device_name}
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=50
+
+    # Get the audio stream name (where chunks are sent)
+    ${audio_stream_name}=    Set Variable    audio:stream:${client_id}
+
+    # Close stream - this MUST send end_marker
+    Close Audio Stream    ${stream_id}
+
+    # Allow time for end_marker to be written
+    Sleep    2s
+
+    # Read all messages from audio stream to find end_marker
+    ${messages}=    Redis Command    XRANGE    ${audio_stream_name}    -    +
+
+    # Search for end_marker in messages
+    ${found_end_marker}=    Set Variable    ${False}
+    FOR    ${message}    IN    @{messages}
+        # Message format: [message_id, [field1, value1, field2, value2, ...]]
+        ${fields}=    Set Variable    ${message}[1]
+
+        # Check if 'end_marker' field exists
+        ${field_count}=    Get Length    ${fields}
+        FOR    ${index}    IN RANGE    0    ${field_count}    2
+            ${field_name}=    Set Variable    ${fields}[${index}]
+            # str() covers both str and bytes field names (b'end_marker')
+            IF    'end_marker' in str($field_name)
+                ${found_end_marker}=    Set Variable    ${True}
+                Log    Found end_marker in audio stream at message ${message}[0]
+                BREAK
+            END
+        END
+
+        IF    ${found_end_marker}
+            BREAK
+        END
+    END
+
+    Should Be True    ${found_end_marker}
+    ...    end_marker NOT found in Redis stream ${audio_stream_name}! Producer.finalize_session() did not send end_marker.
+
+    Log    ✅ end_marker successfully sent to Redis stream
+
+
+Streaming Consumer Closes Deepgram Connection On End Marker
+    [Documentation]    Verify streaming consumer detects end_marker and closes cleanly
+    ...    This tests the consumer side of the bug fix
+    [Tags]    audio-streaming    infra
+
+    ${device_name}=    Set Variable    consumer-close-test
+    ${client_id}=    Get Client ID From Device Name    ${device_name}
+
+    # Stream and close
+    ${stream_id}=    Open Audio Stream    device_name=${device_name}
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=100
+    Close Audio Stream    ${stream_id}
+
+    # Wait for streaming consumer to process end_marker
+    Sleep    10s
+
+    # Check for Deepgram timeout errors in backend logs
+    # If end_marker works, we should NOT see timeout errors
+    ${logs}=    Get Backend Logs    since=30s
+
+    # Should NOT contain Deepgram timeout error
+    Should Not Contain    ${logs}    error 1011
+    ...    Deepgram timeout error found - CloseStream was not sent! This indicates end_marker was not processed by streaming consumer.
+
+    Should Not Contain    ${logs}    Deepgram did not receive audio data or a text message within the timeout window
+    ...    Deepgram timeout found - stream was not closed properly
+
+    Log    ✅ No Deepgram timeout errors - streaming consumer processed end_marker correctly
+
+
diff --git a/tests/resources/queue_keywords.robot b/tests/resources/queue_keywords.robot
index 98012d9a..80856883 100644
--- a/tests/resources/queue_keywords.robot
+++ b/tests/resources/queue_keywords.robot
@@ -324,4 +324,19 @@ Job Should Be Complete
    ${job}=    Get Job    status    ${job_id}
    ${status}=    Set Variable    ${job}[status]
-    Should Be True    '${status}' in ['completed', 'finished', 'failed']    Job status: ${status}
\ No newline at end of file
+    Should Be True    '${status}' in ['completed', 'finished', 'failed']    Job status: ${status}
+
+
+Get Job Result
+    [Documentation]    Get the result field of a completed job
+    ...
Useful for checking job output/return values + [Arguments] ${job_id} + + # Get full job details + ${response}= GET On Session api /api/queue/job/${job_id} + ... expected_status=200 + + ${job_data}= Set Variable ${response.json()} + ${result}= Set Variable ${job_data}[result] + + RETURN ${result} \ No newline at end of file diff --git a/tests/resources/redis_keywords.robot b/tests/resources/redis_keywords.robot index 1aa85e9b..48aaeed0 100644 --- a/tests/resources/redis_keywords.robot +++ b/tests/resources/redis_keywords.robot @@ -73,3 +73,37 @@ Session Field Should Equal ${actual}= Get Session Field Value ${session_id} ${field_name} Should Be Equal ${actual} ${expected_value} ... Session field ${field_name} mismatch: expected ${expected_value}, got ${actual} + + +Redis Command + [Documentation] Execute a generic Redis command and return the result + ... Useful for operations like XLEN, XRANGE, etc. + [Arguments] ${command} @{args} + + # Execute redis-cli command + ${result}= Run Process docker exec ${REDIS_CONTAINER} + ... redis-cli ${command} @{args} + + Should Be Equal As Integers ${result.rc} 0 + ... Redis command failed: ${result.stderr} + + # Return stdout, stripping whitespace + ${output}= Strip String ${result.stdout} + + # Try to convert to integer if it's a number (for commands like XLEN) + ${is_digit}= Run Keyword And Return Status Should Match Regexp ${output} ^\\d+$ + ${return_value}= Run Keyword If ${is_digit} + ... Convert To Integer ${output} + ... ELSE Set Variable ${output} + + RETURN ${return_value} + + +Get Backend Logs + [Documentation] Get backend container logs for debugging + [Arguments] ${since}=5m + + ${result}= Run Process docker compose logs --since ${since} chronicle-backend + ... shell=True stderr=STDOUT + + RETURN ${result.stdout} diff --git a/tests/scripts/sdk_test_auth.py b/tests/scripts/sdk_test_auth.py new file mode 100644 index 00000000..c453998b --- /dev/null +++ b/tests/scripts/sdk_test_auth.py @@ -0,0 +1,18 @@ +#!/usr/bin/env python3 +"""Test SDK authentication.""" +import sys +from pathlib import Path + +# Add SDK to path +sdk_path = Path(__file__).parent.parent.parent / "sdk" / "python" +sys.path.insert(0, str(sdk_path)) + +from chronicle_sdk import ChronicleClient + +backend_url = sys.argv[1] +email = sys.argv[2] +password = sys.argv[3] + +client = ChronicleClient(backend_url) +client.login(email, password) +print("SUCCESS") diff --git a/tests/scripts/sdk_test_conversations.py b/tests/scripts/sdk_test_conversations.py new file mode 100644 index 00000000..51d1d473 --- /dev/null +++ b/tests/scripts/sdk_test_conversations.py @@ -0,0 +1,19 @@ +#!/usr/bin/env python3 +"""Test SDK conversation retrieval.""" +import sys +from pathlib import Path + +# Add SDK to path +sdk_path = Path(__file__).parent.parent.parent / "sdk" / "python" +sys.path.insert(0, str(sdk_path)) + +from chronicle_sdk import ChronicleClient + +backend_url = sys.argv[1] +email = sys.argv[2] +password = sys.argv[3] + +client = ChronicleClient(backend_url) +client.login(email, password) +conversations = client.get_conversations(limit=1) +print(f"COUNT:{len(conversations)}") diff --git a/tests/scripts/sdk_test_upload.py b/tests/scripts/sdk_test_upload.py new file mode 100644 index 00000000..12a5a7ec --- /dev/null +++ b/tests/scripts/sdk_test_upload.py @@ -0,0 +1,23 @@ +#!/usr/bin/env python3 +"""Test SDK audio upload.""" +import sys +from pathlib import Path + +# Add SDK to path +sdk_path = Path(__file__).parent.parent.parent / "sdk" / "python" +sys.path.insert(0, str(sdk_path)) + +from 
chronicle_sdk import ChronicleClient + +backend_url = sys.argv[1] +email = sys.argv[2] +password = sys.argv[3] +audio_file = sys.argv[4] + +client = ChronicleClient(backend_url, timeout=60) +client.login(email, password) +result = client.upload_audio(audio_file) + +print(f"STATUS:{result.files[0].status}") +if result.files[0].conversation_id: + print(f"CONVERSATION_ID:{result.files[0].conversation_id}") diff --git a/tests/unit/test_config_loading.py b/tests/unit/test_config_loading.py new file mode 100644 index 00000000..28477462 --- /dev/null +++ b/tests/unit/test_config_loading.py @@ -0,0 +1,199 @@ +"""Test configuration loading and merging. + +Tests for the configuration system that merges defaults.yml with config.yml +and provides proper caching and reload mechanisms. +""" + +import pytest +from pathlib import Path +from advanced_omi_backend.config import get_config, merge_configs, reload_config + + +def test_merge_configs_basic(): + """Test basic config merging.""" + defaults = {"a": 1, "b": 2} + overrides = {"b": 3, "c": 4} + + result = merge_configs(defaults, overrides) + + assert result["a"] == 1 # From defaults + assert result["b"] == 3 # Override + assert result["c"] == 4 # New key + + +def test_merge_configs_nested(): + """Test nested dictionary merging.""" + defaults = { + "memory": { + "provider": "chronicle", + "timeout": 120 + } + } + overrides = { + "memory": { + "provider": "openmemory_mcp" + } + } + + result = merge_configs(defaults, overrides) + + assert result["memory"]["provider"] == "openmemory_mcp" # Override + assert result["memory"]["timeout"] == 120 # Preserved from defaults + + +def test_merge_configs_deep_nested(): + """Test deeply nested dictionary merging.""" + defaults = { + "models": { + "llm": { + "openai": { + "model": "gpt-4o-mini", + "temperature": 0.2, + "max_tokens": 2000 + } + } + } + } + overrides = { + "models": { + "llm": { + "openai": { + "temperature": 0.5 + } + } + } + } + + result = merge_configs(defaults, overrides) + + assert result["models"]["llm"]["openai"]["model"] == "gpt-4o-mini" # Preserved + assert result["models"]["llm"]["openai"]["temperature"] == 0.5 # Override + assert result["models"]["llm"]["openai"]["max_tokens"] == 2000 # Preserved + + +def test_merge_configs_list_replacement(): + """Test that lists are replaced, not merged.""" + defaults = {"items": [1, 2, 3]} + overrides = {"items": [4, 5]} + + result = merge_configs(defaults, overrides) + + assert result["items"] == [4, 5] # List replaced entirely + + +def test_merge_configs_empty_override(): + """Test merging with empty override dictionary.""" + defaults = {"a": 1, "b": 2} + overrides = {} + + result = merge_configs(defaults, overrides) + + assert result["a"] == 1 + assert result["b"] == 2 + + +def test_merge_configs_empty_defaults(): + """Test merging with empty defaults dictionary.""" + defaults = {} + overrides = {"a": 1, "b": 2} + + result = merge_configs(defaults, overrides) + + assert result["a"] == 1 + assert result["b"] == 2 + + +def test_get_config_structure(): + """Test that get_config returns expected structure.""" + config = get_config() + + # Should have main sections + assert isinstance(config, dict) + assert "defaults" in config or "models" in config # At least one of these should exist + + +def test_get_config_caching(): + """Test config caching mechanism.""" + config1 = get_config() + config2 = get_config() + + # Should return cached instance (same object) + assert config1 is config2 + + +def test_reload_config(): + """Test config reload invalidates 
cache.""" + config1 = get_config() + config2 = reload_config() + + # Should be different instances after reload + # (Note: Content might be the same, but object should be different) + # We check that reload returns a config object + assert isinstance(config2, dict) + + +def test_merge_configs_none_handling(): + """Test handling of None values in merging.""" + defaults = {"a": 1, "b": None} + overrides = {"b": 2, "c": None} + + result = merge_configs(defaults, overrides) + + assert result["a"] == 1 + assert result["b"] == 2 # Override None with value + assert result["c"] is None # New key with None + + +def test_merge_configs_complex_scenario(): + """Test complex real-world scenario with mixed types.""" + defaults = { + "defaults": { + "llm": "openai-llm", + "stt": "stt-deepgram" + }, + "models": [ + {"name": "model1", "type": "llm"}, + {"name": "model2", "type": "embedding"} + ], + "memory": { + "provider": "chronicle", + "timeout_seconds": 1200, + "extraction": { + "enabled": True, + "prompt": "Default prompt" + } + } + } + overrides = { + "defaults": { + "llm": "local-llm" + }, + "models": [ + {"name": "model3", "type": "llm"} + ], + "memory": { + "extraction": { + "prompt": "Custom prompt" + } + } + } + + result = merge_configs(defaults, overrides) + + # Defaults section merged + assert result["defaults"]["llm"] == "local-llm" # Override + assert result["defaults"]["stt"] == "stt-deepgram" # Preserved + + # Models list replaced + assert len(result["models"]) == 1 + assert result["models"][0]["name"] == "model3" + + # Memory section deeply merged + assert result["memory"]["provider"] == "chronicle" # Preserved + assert result["memory"]["timeout_seconds"] == 1200 # Preserved + assert result["memory"]["extraction"]["enabled"] is True # Preserved + assert result["memory"]["extraction"]["prompt"] == "Custom prompt" # Override + + +if __name__ == "__main__": + pytest.main([__file__, "-v"])