From a4681c53aa9ddad672bbe7429fa8cd9909ec4253 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Mon, 19 Jan 2026 17:02:58 +0000
Subject: [PATCH 01/14] Refactor job status handling to align with RQ standards

- Updated job status checks across various modules to use "started" and "finished" instead of "processing" and "completed" for consistency with RQ's naming conventions.
- Adjusted related logging and response messages to reflect the new status terminology.
- Simplified Docker Compose project name handling in test scripts to avoid conflicts and improve clarity in test environment setup.
---
 backends/advanced/docker-compose-test.yml     |   2 +
 backends/advanced/run-test.sh                 |  12 +-
 .../controllers/audio_controller.py           |   6 +-
 .../controllers/queue_controller.py           |  76 +++++++--
 .../controllers/session_controller.py         |  40 ++---
 .../routers/modules/obsidian_routes.py        |   8 +-
 .../routers/modules/queue_routes.py           | 154 ++++++++----------
 .../utils/conversation_utils.py               |  11 ++
 .../advanced_omi_backend/utils/job_utils.py   |   2 +-
 .../workers/audio_jobs.py                     |   2 +-
 .../workers/conversation_jobs.py              |   2 +-
 .../workers/obsidian_jobs.py                  |  18 +-
 .../workers/transcription_jobs.py             |   2 +-
 backends/advanced/upload_files.py             |   8 +-
 backends/advanced/webui/src/pages/Queue.tsx   |  86 +++++-----
 backends/advanced/webui/src/pages/Upload.tsx  |   4 +-
 config/defaults.yml                           |   6 +-
 tests/Makefile                                |  44 +++--
 tests/bin/rebuild-containers.sh               |  44 +----
 tests/bin/save-container-logs.sh              |  14 +-
 tests/bin/start-containers.sh                 |   4 +-
 tests/bin/start-rebuild-containers.sh         |  48 ++++++
 tests/bin/status-containers.sh                |   9 +-
 tests/endpoints/audio_upload_tests.robot      |  10 +-
 tests/endpoints/client_queue_tests.robot      |   4 +-
 tests/endpoints/conversation_tests.robot      |   6 +-
 tests/endpoints/health_tests.robot            |   4 +-
 tests/endpoints/plugin_tests.robot            |   8 +-
 tests/endpoints/rq_queue_tests.robot          |  14 +-
 tests/infrastructure/infra_tests.robot        |   4 +-
 tests/integration/conversation_queue.robot    |   8 +-
 tests/integration/integration_test.robot      |  24 +--
 tests/integration/sdk_tests.robot             |   2 +-
 .../websocket_streaming_tests.robot           |  10 +-
 .../websocket_transcription_e2e_test.robot    |  41 ++---
 tests/resources/audio_keywords.robot          |  18 +-
 tests/resources/conversation_keywords.robot   |   6 +-
 tests/resources/memory_keywords.robot         |  12 +-
 tests/resources/queue_keywords.robot          |  19 ++-
 tests/resources/websocket_keywords.robot      |   4 +-
 tests/run-no-api-tests.sh                     |   9 +-
 tests/run-robot-tests.sh                      |   7 +-
 tests/setup-test-containers.sh                |   9 +-
 tests/setup/test_manager_keywords.robot       |   4 +-
 tests/teardown-test-containers.sh             |   6 +-
 45 files changed, 428 insertions(+), 403 deletions(-)
 create mode 100755 tests/bin/start-rebuild-containers.sh

diff --git a/backends/advanced/docker-compose-test.yml b/backends/advanced/docker-compose-test.yml
index 999b37a2..e89102f5 100644
--- a/backends/advanced/docker-compose-test.yml
+++ b/backends/advanced/docker-compose-test.yml
@@ -2,6 +2,8 @@
 # Isolated test environment for integration tests
 # Uses different ports to avoid conflicts with development environment
 
+name: backend-test
+
 services:
   chronicle-backend-test:
     build:
diff --git a/backends/advanced/run-test.sh b/backends/advanced/run-test.sh
index c68a30ea..61fd7d55 100755
--- a/backends/advanced/run-test.sh
+++ b/backends/advanced/run-test.sh
@@ -219,17 +219,13 @@ if [ -d "./data/test_audio_chunks/" ] || [ -d "./data/test_data/" ] || [ -d "./d
     docker run --rm -v "$(pwd)/data:/data" alpine sh -c 'rm -rf /data/test_*' 2>/dev/null || true
 fi
 
-# Use unique project name to avoid conflicts with development environment
-export COMPOSE_PROJECT_NAME="advanced-backend-test"
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
 
 # Stop any existing test containers
 print_info "Stopping existing test containers..."
-# Try cleanup with current project name
 docker compose -f docker-compose-test.yml down -v || true
 
-# Also try cleanup with default project name (in case containers were started without COMPOSE_PROJECT_NAME)
-COMPOSE_PROJECT_NAME=advanced docker compose -f docker-compose-test.yml down -v 2>/dev/null || true
-
 # Run integration tests
 print_info "Running integration tests..."
 print_info "Using fresh mode (CACHED_MODE=False) for clean testing"
@@ -268,8 +264,6 @@ else
     if [ "${CLEANUP_CONTAINERS:-true}" != "false" ]; then
         print_info "Cleaning up test containers after failure..."
         docker compose -f docker-compose-test.yml down -v || true
-        # Also cleanup with default project name
-        COMPOSE_PROJECT_NAME=advanced docker compose -f docker-compose-test.yml down -v 2>/dev/null || true
         docker system prune -f || true
     else
         print_warning "Skipping cleanup (CLEANUP_CONTAINERS=false) - containers left running for debugging"
@@ -282,8 +276,6 @@ fi
 if [ "${CLEANUP_CONTAINERS:-true}" != "false" ]; then
     print_info "Cleaning up test containers..."
     docker compose -f docker-compose-test.yml down -v || true
-    # Also cleanup with default project name
-    COMPOSE_PROJECT_NAME=advanced docker compose -f docker-compose-test.yml down -v 2>/dev/null || true
     docker system prune -f || true
 else
     print_warning "Skipping cleanup (CLEANUP_CONTAINERS=false) - containers left running"
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index 041bd06b..d726a392 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -203,7 +203,7 @@ async def upload_and_process_audio_files(
 
                 processed_files.append({
                     "filename": file.filename,
-                    "status": "processing",
+                    "status": "started",  # RQ standard: job has been enqueued
                     "conversation_id": conversation_id,
                     "transcript_job_id": transcription_job.id,
                     "speaker_job_id": job_ids['speaker_recognition'],
@@ -233,7 +233,7 @@ async def upload_and_process_audio_files(
                     "error": str(e),
                 })
 
-        successful_files = [f for f in processed_files if f.get("status") == "processing"]
+        successful_files = [f for f in processed_files if f.get("status") == "started"]
         failed_files = [f for f in processed_files if f.get("status") == "error"]
 
         return {
@@ -242,7 +242,7 @@ async def upload_and_process_audio_files(
             "files": processed_files,
             "summary": {
                 "total": len(files),
-                "processing": len(successful_files),
+                "started": len(successful_files),  # RQ standard
                 "failed": len(failed_files),
             },
         }
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
index 9cd374e0..d804df95 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
@@ -17,7 +17,7 @@
 
 import redis
 from rq import Queue, Worker
-from rq.job import Job
+from rq.job import Job, JobStatus
 from rq.registry import ScheduledJobRegistry, DeferredJobRegistry
 
 from advanced_omi_backend.models.job import JobPriority
@@ -30,6 +30,52 @@
 REDIS_URL = os.getenv("REDIS_URL", "redis://localhost:6379/0")
 redis_conn = redis.from_url(REDIS_URL)
 
+
+def get_job_status_from_rq(job: Job) -> str:
+    """
+    Get job status using RQ's native method.
+
+    Uses job.get_status() which is the Redis Queue standard approach.
+    Returns RQ's standard status names.
+
+    Returns one of: queued, started, finished, failed, deferred, scheduled, canceled, stopped
+
+    Raises:
+        RuntimeError: If job status is unexpected (should never happen with RQ's method)
+    """
+    rq_status = job.get_status()
+
+    # RQ returns status as JobStatus enum or string
+    # Convert to string if it's an enum
+    if isinstance(rq_status, JobStatus):
+        status_str = rq_status.value
+    else:
+        status_str = str(rq_status)
+
+    # Validate it's a known RQ status
+    valid_statuses = {
+        JobStatus.QUEUED.value,
+        JobStatus.STARTED.value,
+        JobStatus.FINISHED.value,
+        JobStatus.FAILED.value,
+        JobStatus.DEFERRED.value,
+        JobStatus.SCHEDULED.value,
+        JobStatus.CANCELED.value,
+        JobStatus.STOPPED.value,
+    }
+
+    if status_str not in valid_statuses:
+        logger.error(
+            f"Job {job.id} has unexpected RQ status: {status_str}. "
+            f"This indicates RQ library added a new status we don't know about."
+        )
+        raise RuntimeError(
+            f"Job {job.id} has unknown RQ status: {status_str}. "
+            f"Please update get_job_status_from_rq() to handle this new status."
+        )
+
+    return status_str
+
 # Queue name constants
 TRANSCRIPTION_QUEUE = "transcription"
 MEMORY_QUEUE = "memory"
@@ -61,34 +107,34 @@ def get_queue(queue_name: str = DEFAULT_QUEUE) -> Queue:
 
 
 def get_job_stats() -> Dict[str, Any]:
-    """Get statistics about jobs in all queues matching frontend expectations."""
+    """Get statistics about jobs in all queues using RQ standard status names."""
     total_jobs = 0
     queued_jobs = 0
-    processing_jobs = 0
-    completed_jobs = 0
+    started_jobs = 0  # RQ standard: "started" not "processing"
+    finished_jobs = 0  # RQ standard: "finished" not "completed"
     failed_jobs = 0
-    cancelled_jobs = 0
+    canceled_jobs = 0  # RQ standard: "canceled" not "cancelled"
     deferred_jobs = 0  # Jobs waiting for dependencies (depends_on)
 
     for queue_name in QUEUE_NAMES:
         queue = get_queue(queue_name)
 
         queued_jobs += len(queue)
-        processing_jobs += len(queue.started_job_registry)
-        completed_jobs += len(queue.finished_job_registry)
+        started_jobs += len(queue.started_job_registry)
+        finished_jobs += len(queue.finished_job_registry)
         failed_jobs += len(queue.failed_job_registry)
-        cancelled_jobs += len(queue.canceled_job_registry)
+        canceled_jobs += len(queue.canceled_job_registry)
         deferred_jobs += len(queue.deferred_job_registry)
 
-    total_jobs = queued_jobs + processing_jobs + completed_jobs + failed_jobs + cancelled_jobs + deferred_jobs
+    total_jobs = queued_jobs + started_jobs + finished_jobs + failed_jobs + canceled_jobs + deferred_jobs
 
     return {
         "total_jobs": total_jobs,
         "queued_jobs": queued_jobs,
-        "processing_jobs": processing_jobs,
-        "completed_jobs": completed_jobs,
+        "started_jobs": started_jobs,
+        "finished_jobs": finished_jobs,
         "failed_jobs": failed_jobs,
-        "cancelled_jobs": cancelled_jobs,
+        "canceled_jobs": canceled_jobs,
         "deferred_jobs": deferred_jobs,
         "timestamp": datetime.utcnow().isoformat()
     }
@@ -124,11 +170,11 @@ def get_jobs(
     for qname in queues_to_check:
         queue = get_queue(qname)
 
-        # Collect jobs from all registries
+        # Collect jobs from all registries (using RQ standard status names)
         registries = [
             (queue.job_ids, "queued"),
-            (queue.started_job_registry.get_job_ids(), "processing"),
-            (queue.finished_job_registry.get_job_ids(), "completed"),
+            (queue.started_job_registry.get_job_ids(), "started"),  # RQ standard, not "processing"
+            (queue.finished_job_registry.get_job_ids(), "finished"),  # RQ standard, not "completed"
             (queue.failed_job_registry.get_job_ids(), "failed"),
             (queue.deferred_job_registry.get_job_ids(), "deferred"),  # Jobs waiting for dependencies
         ]
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
index d1a22695..165bb4c3 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
@@ -57,11 +57,11 @@ async def mark_session_complete(
     """
     session_key = f"audio:session:{session_id}"
     await redis_client.hset(session_key, mapping={
-        "status": "complete",
+        "status": "finished",
         "completed_at": str(time.time()),
         "completion_reason": reason
     })
-    logger.info(f"✅ Session {session_id[:12]} marked complete: {reason}")
+    logger.info(f"✅ Session {session_id[:12]} marked finished: {reason}")
 
 
 async def get_session_info(redis_client, session_id: str) -> Optional[Dict]:
@@ -231,15 +231,15 @@ async def get_streaming_status(request):
             # Check if all jobs are complete (including failed jobs)
             all_jobs_done = all_jobs_complete_for_session(session_id)
 
-            # Session is completed if:
-            # 1. Redis status says complete/finalized AND all jobs done, OR
-            # 2. All jobs are done (even if status isn't complete yet)
-            # This ensures sessions with failed jobs move to completed
-            if status in ["complete", "completed", "finalized"] or all_jobs_done:
+            # Session is finished if:
+            # 1. Redis status says finished AND all jobs done, OR
+            # 2. All jobs are done (even if status isn't finished yet)
+            # This ensures sessions with failed jobs move to finished
+            if status == "finished" or all_jobs_done:
                 if all_jobs_done:
-                    # All jobs complete - this is truly a completed session
-                    # Update Redis status if it wasn't already marked complete
-                    if status not in ["complete", "completed", "finalized"]:
+                    # All jobs finished - this is truly a finished session
+                    # Update Redis status if it wasn't already marked finished
+                    if status != "finished":
                         await mark_session_complete(redis_client, session_id, "all_jobs_complete")
 
                     # Get additional session data for completed sessions
@@ -251,7 +251,7 @@ async def get_streaming_status(request):
                         "client_id": session_obj.get("client_id", ""),
                         "conversation_id": session_data.get(b"conversation_id", b"").decode() if session_data and b"conversation_id" in session_data else None,
                         "has_conversation": bool(session_data and session_data.get(b"conversation_id", b"")),
-                        "action": session_data.get(b"action", b"complete").decode() if session_data and b"action" in session_data else "complete",
+                        "action": session_data.get(b"action", b"finished").decode() if session_data and b"action" in session_data else "finished",
                         "reason": session_data.get(b"reason", b"").decode() if session_data and b"reason" in session_data else "",
                         "completed_at": session_obj.get("last_chunk_at", 0),
                         "audio_file": session_data.get(b"audio_file", b"").decode() if session_data and b"audio_file" in session_data else "",
@@ -450,26 +450,26 @@ async def get_streaming_status(request):
         rq_stats = {
             "transcription_queue": {
                 "queued": transcription_queue.count,
-                "processing": len(transcription_queue.started_job_registry),
-                "completed": len(transcription_queue.finished_job_registry),
+                "started": len(transcription_queue.started_job_registry),
+                "finished": len(transcription_queue.finished_job_registry),
                 "failed": len(transcription_queue.failed_job_registry),
-                "cancelled": len(transcription_queue.canceled_job_registry),
+                "canceled": len(transcription_queue.canceled_job_registry),
                 "deferred": len(transcription_queue.deferred_job_registry)
             },
             "memory_queue": {
                 "queued": memory_queue.count,
-                "processing": len(memory_queue.started_job_registry),
-                "completed": len(memory_queue.finished_job_registry),
+                "started": len(memory_queue.started_job_registry),
+                "finished": len(memory_queue.finished_job_registry),
                 "failed": len(memory_queue.failed_job_registry),
-                "cancelled": len(memory_queue.canceled_job_registry),
+                "canceled": len(memory_queue.canceled_job_registry),
                 "deferred": len(memory_queue.deferred_job_registry)
             },
             "default_queue": {
                 "queued": default_queue.count,
-                "processing": len(default_queue.started_job_registry),
-                "completed": len(default_queue.finished_job_registry),
+                "started": len(default_queue.started_job_registry),
+                "finished": len(default_queue.finished_job_registry),
                 "failed": len(default_queue.failed_job_registry),
-                "cancelled": len(default_queue.canceled_job_registry),
+                "canceled": len(default_queue.canceled_job_registry),
                 "deferred": len(default_queue.deferred_job_registry)
             }
         }
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/obsidian_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/obsidian_routes.py
index e45c51de..f6a46a38 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/obsidian_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/obsidian_routes.py
@@ -176,14 +176,12 @@ async def get_status(job_id: str, current_user: User = Depends(current_active_us
         status = job.get_status()
         if status == "started":
             status = "running"
-        if status == "canceled":
-            status = "cancelled"
-            
+
         # Get metadata
         meta = job.meta or {}
-        
+
         # If meta has status, prefer it (for granular updates)
-        if "status" in meta and meta["status"] in ("running", "completed", "failed", "cancelled"):
+        if "status" in meta and meta["status"] in ("running", "finished", "failed", "canceled"):
              status = meta["status"]
 
         total = meta.get("total_files", 0)
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/queue_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/queue_routes.py
index 8dd9e5f6..14c7ee0e 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/queue_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/queue_routes.py
@@ -9,7 +9,7 @@
 from typing import List, Optional
 
 from advanced_omi_backend.auth import current_active_user
-from advanced_omi_backend.controllers.queue_controller import get_jobs, get_job_stats, redis_conn, QUEUE_NAMES
+from advanced_omi_backend.controllers.queue_controller import get_jobs, get_job_stats, redis_conn, QUEUE_NAMES, get_job_status_from_rq
 from advanced_omi_backend.users import User
 from rq.job import Job
 import redis.asyncio as aioredis
@@ -65,18 +65,12 @@ async def get_job_status(
             if job_user_id != str(current_user.user_id):
                 raise HTTPException(status_code=403, detail="Access forbidden")
 
-        # Determine status from registries
-        status = "unknown"
-        if job.is_queued:
-            status = "queued"
-        elif job.is_started:
-            status = "processing"
-        elif job.is_finished:
-            status = "completed"
-        elif job.is_failed:
-            status = "failed"
-        elif job.is_deferred:
-            status = "deferred"
+        # Get status using RQ's native method
+        try:
+            status = get_job_status_from_rq(job)
+        except RuntimeError as e:
+            logger.error(f"Failed to determine status for job {job_id}: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
 
         return {
             "job_id": job.id,
@@ -106,18 +100,12 @@ async def get_job(
             if job_user_id != str(current_user.user_id):
                 raise HTTPException(status_code=403, detail="Access forbidden")
 
-        # Determine status from registries
-        status = "unknown"
-        if job.is_queued:
-            status = "queued"
-        elif job.is_started:
-            status = "processing"
-        elif job.is_finished:
-            status = "completed"
-        elif job.is_failed:
-            status = "failed"
-        elif job.is_deferred:
-            status = "deferred"
+        # Get status using RQ's native method
+        try:
+            status = get_job_status_from_rq(job)
+        except RuntimeError as e:
+            logger.error(f"Failed to determine status for job {job_id}: {e}")
+            raise HTTPException(status_code=500, detail=str(e))
 
         return {
             "job_id": job.id,
@@ -157,18 +145,18 @@ async def cancel_job(
             if job_user_id != str(current_user.user_id):
                 raise HTTPException(status_code=403, detail="Access forbidden")
 
-        # Cancel if queued or processing, delete if completed/failed
+        # Cancel if queued or started, delete if finished/failed
         if job.is_queued or job.is_started or job.is_deferred or job.is_scheduled:
             # Cancel the job
             job.cancel()
             logger.info(f"Cancelled job {job_id}")
             return {
                 "job_id": job_id,
-                "action": "cancelled",
-                "message": f"Job {job_id} has been cancelled"
+                "action": "canceled",
+                "message": f"Job {job_id} has been canceled"
             }
         else:
-            # Delete completed/failed jobs
+            # Delete finished/failed jobs
             job.delete()
             logger.info(f"Deleted job {job_id}")
             return {
@@ -182,7 +170,7 @@ async def cancel_job(
         raise
     except Exception as e:
         logger.error(f"Failed to cancel/delete job {job_id}: {e}")
-        raise HTTPException(status_code=404, detail=f"Job not found or could not be cancelled: {str(e)}")
+        raise HTTPException(status_code=404, detail=f"Job not found or could not be canceled: {str(e)}")
 
 
 @router.get("/jobs/by-client/{client_id}")
@@ -201,21 +189,14 @@ async def get_jobs_by_client(
         queues = QUEUE_NAMES
 
         def get_job_status(job, registries_map):
-            """Determine job status from registries."""
-            if job.is_queued:
-                return "queued"
-            elif job.is_started:
-                return "processing"
-            elif job.is_finished:
-                return "completed"
-            elif job.is_failed:
-                return "failed"
-            elif job.is_deferred:
-                return "deferred"
-            elif job.is_scheduled:
-                return "waiting"
-            else:
-                return "unknown"
+            """Determine job status using RQ's native method."""
+            try:
+                return get_job_status_from_rq(job)
+            except RuntimeError:
+                # In nested function, can't raise HTTP exception
+                # Log and re-raise to be handled by outer scope
+                logger.error(f"Job {job.id} status determination failed")
+                raise
 
         def process_job_and_dependents(job, queue_name, base_status):
             """Process a job and recursively find all its dependents."""
@@ -270,15 +251,15 @@ def process_job_and_dependents(job, queue_name, base_status):
         for queue_name in queues:
             queue = get_queue(queue_name)
 
-            # Check all registries
+            # Check all registries (using RQ standard status names)
             registries = [
                 ("queued", queue.job_ids),
-                ("processing", StartedJobRegistry(queue=queue).get_job_ids()),
-                ("completed", FinishedJobRegistry(queue=queue).get_job_ids()),
+                ("started", StartedJobRegistry(queue=queue).get_job_ids()),  # RQ standard
+                ("finished", FinishedJobRegistry(queue=queue).get_job_ids()),  # RQ standard
                 ("failed", FailedJobRegistry(queue=queue).get_job_ids()),
-                ("cancelled", CanceledJobRegistry(queue=queue).get_job_ids()),
-                ("waiting", DeferredJobRegistry(queue=queue).get_job_ids()),
-                ("waiting", ScheduledJobRegistry(queue=queue).get_job_ids())
+                ("canceled", CanceledJobRegistry(queue=queue).get_job_ids()),  # RQ standard (US spelling)
+                ("deferred", DeferredJobRegistry(queue=queue).get_job_ids()),
+                ("scheduled", ScheduledJobRegistry(queue=queue).get_job_ids())
             ]
 
             for status_name, job_ids in registries:
@@ -329,7 +310,7 @@ async def get_queue_stats_endpoint(
 
     except Exception as e:
         logger.error(f"Failed to get queue stats: {e}")
-        return {"total_jobs": 0, "queued_jobs": 0, "processing_jobs": 0, "completed_jobs": 0, "failed_jobs": 0, "cancelled_jobs": 0, "deferred_jobs": 0}
+        return {"total_jobs": 0, "queued_jobs": 0, "started_jobs": 0, "finished_jobs": 0, "failed_jobs": 0, "canceled_jobs": 0, "deferred_jobs": 0}
 
 
 @router.get("/worker-details")
@@ -480,13 +461,13 @@ async def get_stream_info(stream_key):
 
 class FlushJobsRequest(BaseModel):
     older_than_hours: int = 24
-    statuses: List[str] = ["completed", "failed", "cancelled"]
+    statuses: List[str] = ["finished", "failed", "canceled"]  # RQ standard status names
 
 
 class FlushAllJobsRequest(BaseModel):
     confirm: bool
     include_failed: bool = False  # By default, preserve failed jobs for debugging
-    include_completed: bool = False  # By default, preserve completed jobs for debugging
+    include_finished: bool = False  # By default, preserve finished jobs for debugging
 
 
 @router.post("/flush")
@@ -512,8 +493,8 @@ async def flush_jobs(
         for queue_name in queues:
             queue = get_queue(queue_name)
 
-            # Flush from appropriate registries based on requested statuses
-            if "completed" in request.statuses:
+            # Flush from appropriate registries based on requested statuses (RQ standard names)
+            if "finished" in request.statuses:  # RQ standard, not "completed"
                 registry = FinishedJobRegistry(queue=queue)
                 for job_id in registry.get_job_ids():
                     try:
@@ -535,7 +516,7 @@ async def flush_jobs(
                     except Exception as e:
                         logger.error(f"Error deleting job {job_id}: {e}")
 
-            if "cancelled" in request.statuses:
+            if "canceled" in request.statuses:  # RQ standard (US spelling), not "cancelled"
                 registry = CanceledJobRegistry(queue=queue)
                 for job_id in registry.get_job_ids():
                     try:
@@ -564,8 +545,8 @@ async def flush_all_jobs(
 ):
     """
     Flush jobs from queues and registries.
-    By default preserves failed and completed jobs for debugging.
-    Set include_failed=true or include_completed=true to flush those as well.
+    By default preserves failed and finished jobs for debugging.
+    Set include_failed=true or include_finished=true to flush those as well.
     """
     if not current_user.is_superuser:
         raise HTTPException(status_code=403, detail="Admin access required")
@@ -607,7 +588,7 @@ async def flush_all_jobs(
             # Conditionally add failed and finished registries
             if request.include_failed:
                 registries.append(("failed", FailedJobRegistry(queue=queue)))
-            if request.include_completed:
+            if request.include_finished:
                 registries.append(("finished", FinishedJobRegistry(queue=queue)))
 
             for registry_name, registry in registries:
@@ -691,8 +672,8 @@ async def flush_all_jobs(
         preserved = []
         if not request.include_failed:
             preserved.append("failed jobs")
-        if not request.include_completed:
-            preserved.append("completed jobs")
+        if not request.include_finished:
+            preserved.append("finished jobs")
 
         preserved_msg = f" (preserved {', '.join(preserved)})" if preserved else ""
         logger.info(f"Flushed {total_removed} jobs and {deleted_keys} Redis keys from all queues{preserved_msg}")
@@ -833,7 +814,7 @@ async def get_dashboard_data(
     """Get all data needed for the Queue dashboard in a single API call.
 
     Returns:
-    - Jobs grouped by status (queued, processing, completed, failed)
+    - Jobs grouped by status (queued, started, finished, failed)
     - Queue statistics
     - Streaming status
     - Client jobs for expanded clients
@@ -858,12 +839,12 @@ async def fetch_jobs_by_status(status_name: str, limit: int = 100):
                 for queue_name in queues:
                     queue = get_queue(queue_name)
 
-                    # Get job IDs based on status
+                    # Get job IDs based on status (using RQ standard status names)
                     if status_name == "queued":
                         job_ids = queue.job_ids[:limit]
-                    elif status_name == "processing":
+                    elif status_name == "started":  # RQ standard, not "processing"
                         job_ids = list(StartedJobRegistry(queue=queue).get_job_ids())[:limit]
-                    elif status_name == "completed":
+                    elif status_name == "finished":  # RQ standard, not "completed"
                         job_ids = list(FinishedJobRegistry(queue=queue).get_job_ids())[:limit]
                     elif status_name == "failed":
                         job_ids = list(FailedJobRegistry(queue=queue).get_job_ids())[:limit]
@@ -917,7 +898,7 @@ async def fetch_stats():
                 return get_job_stats()
             except Exception as e:
                 logger.error(f"Error fetching stats: {e}")
-                return {"total_jobs": 0, "queued_jobs": 0, "processing_jobs": 0, "completed_jobs": 0, "failed_jobs": 0}
+                return {"total_jobs": 0, "queued_jobs": 0, "started_jobs": 0, "finished_jobs": 0, "failed_jobs": 0}
 
         async def fetch_streaming_status():
             """Fetch streaming status."""
@@ -941,17 +922,12 @@ async def fetch_client_jobs(client_id: str):
                 queues = QUEUE_NAMES
 
                 def get_job_status(job):
-                    if job.is_queued:
-                        return "queued"
-                    elif job.is_started:
-                        return "processing"
-                    elif job.is_finished:
-                        return "completed"
-                    elif job.is_failed:
-                        return "failed"
-                    elif job.is_deferred:
-                        return "deferred"
-                    else:
+                    """Get job status using RQ's native method."""
+                    try:
+                        return get_job_status_from_rq(job)
+                    except RuntimeError:
+                        logger.error(f"Job {job.id} status determination failed")
+                        # Return unknown as fallback in dashboard context
                         return "unknown"
 
                 # Find all jobs for this session
@@ -966,8 +942,8 @@ def get_job_status(job):
 
                     registries = [
                         ("queued", queue.job_ids),
-                        ("processing", StartedJobRegistry(queue=queue).get_job_ids()),
-                        ("completed", FinishedJobRegistry(queue=queue).get_job_ids()),
+                        ("started", StartedJobRegistry(queue=queue).get_job_ids()),  # RQ standard
+                        ("finished", FinishedJobRegistry(queue=queue).get_job_ids()),  # RQ standard
                         ("failed", FailedJobRegistry(queue=queue).get_job_ids())
                     ]
 
@@ -1016,10 +992,10 @@ def get_job_status(job):
                 logger.error(f"Error fetching jobs for client {client_id}: {e}")
                 return {"client_id": client_id, "jobs": []}
 
-        # Execute all fetches in parallel
+        # Execute all fetches in parallel (using RQ standard status names)
         queued_jobs_task = fetch_jobs_by_status("queued", limit=100)
-        processing_jobs_task = fetch_jobs_by_status("processing", limit=100)
-        completed_jobs_task = fetch_jobs_by_status("completed", limit=50)
+        started_jobs_task = fetch_jobs_by_status("started", limit=100)  # RQ standard, not "processing"
+        finished_jobs_task = fetch_jobs_by_status("finished", limit=50)  # RQ standard, not "completed"
         failed_jobs_task = fetch_jobs_by_status("failed", limit=50)
         stats_task = fetch_stats()
         streaming_status_task = fetch_streaming_status()
@@ -1027,8 +1003,8 @@ def get_job_status(job):
 
         results = await asyncio.gather(
             queued_jobs_task,
-            processing_jobs_task,
-            completed_jobs_task,
+            started_jobs_task,
+            finished_jobs_task,
             failed_jobs_task,
             stats_task,
             streaming_status_task,
@@ -1037,8 +1013,8 @@ def get_job_status(job):
         )
 
         queued_jobs = results[0] if not isinstance(results[0], Exception) else []
-        processing_jobs = results[1] if not isinstance(results[1], Exception) else []
-        completed_jobs = results[2] if not isinstance(results[2], Exception) else []
+        started_jobs = results[1] if not isinstance(results[1], Exception) else []  # RQ standard
+        finished_jobs = results[2] if not isinstance(results[2], Exception) else []  # RQ standard
         failed_jobs = results[3] if not isinstance(results[3], Exception) else []
         stats = results[4] if not isinstance(results[4], Exception) else {"total_jobs": 0}
         streaming_status = results[5] if not isinstance(results[5], Exception) else {"active_sessions": []}
@@ -1066,8 +1042,8 @@ def get_job_status(job):
         return {
             "jobs": {
                 "queued": queued_jobs,
-                "processing": processing_jobs,
-                "completed": completed_jobs,
+                "started": started_jobs,  # RQ standard status name
+                "finished": finished_jobs,  # RQ standard status name
                 "failed": failed_jobs
             },
             "stats": stats,
diff --git a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
index ca62372b..c0f92408 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
@@ -81,6 +81,10 @@ def analyze_speech(transcript_data: dict) -> dict:
     settings = get_speech_detection_settings()
     words = transcript_data.get("words", [])
 
+    logger.info(f"🔬 analyze_speech: words_list_length={len(words)}, settings={settings}")
+    if words and len(words) > 0:
+        logger.info(f"📝 First 3 words: {words[:3]}")
+
     # Method 1: Word-level analysis (preferred - has confidence scores and timing)
     if words:
         # Filter by confidence threshold
@@ -98,6 +102,12 @@ def analyze_speech(transcript_data: dict) -> dict:
                 speech_end = valid_words[-1].get("end", 0)
                 speech_duration = speech_end - speech_start
 
+                # Debug logging for timestamp investigation
+                logger.info(
+                    f"🕐 Speech timing: start={speech_start:.2f}s, end={speech_end:.2f}s, "
+                    f"duration={speech_duration:.2f}s (first_word={valid_words[0]}, last_word={valid_words[-1]})"
+                )
+
                 # If no timing data (duration = 0), fall back to text-only analysis
                 # This happens with some streaming transcription services
                 if speech_duration == 0:
@@ -106,6 +116,7 @@ def analyze_speech(transcript_data: dict) -> dict:
                 else:
                     # Check minimum duration threshold when we have timing data
                     min_duration = settings.get("min_duration", 10.0)
+                    logger.info(f"📏 Comparing duration {speech_duration:.1f}s vs threshold {min_duration:.1f}s")
                     if speech_duration < min_duration:
                         return {
                             "has_speech": False,
diff --git a/backends/advanced/src/advanced_omi_backend/utils/job_utils.py b/backends/advanced/src/advanced_omi_backend/utils/job_utils.py
index ba9fcc74..c9028909 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/job_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/job_utils.py
@@ -44,7 +44,7 @@ async def check_job_alive(redis_client, current_job, session_id: Optional[str] =
             if session_id:
                 session_key = f"audio:session:{session_id}"
                 session_status = await redis_client.hget(session_key, "status")
-                if session_status and session_status.decode() in ["finalizing", "complete", "closed"]:
+                if session_status and session_status.decode() in ["finalizing", "finished"]:
                     # Session ended naturally - not a zombie, just natural cleanup
                     logger.debug(f"📋 Job {current_job.id} ending naturally (session closed)")
                     return False
diff --git a/backends/advanced/src/advanced_omi_backend/workers/audio_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/audio_jobs.py
index 58acad62..8505d547 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/audio_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/audio_jobs.py
@@ -210,7 +210,7 @@ async def flush_pcm_buffer():
 
         # Check if session is finalizing
         session_status = await redis_client.hget(session_key, "status")
-        if session_status and session_status.decode() in ["finalizing", "complete"]:
+        if session_status and session_status.decode() in ["finalizing", "finished"]:
             logger.info(f"🛑 Session finalizing detected, flushing final chunks...")
             await asyncio.sleep(0.5)  # Brief wait for in-flight chunks
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index e458a7fe..8edc01e4 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -315,7 +315,7 @@ async def open_conversation_job(
             status = await redis_client.hget(session_key, "status")
             status_str = status.decode() if status else None
 
-            if status_str in ["finalizing", "complete"]:
+            if status_str in ["finalizing", "finished"]:
                 finalize_received = True
 
                 # Get completion reason (guaranteed to exist with unified API)
diff --git a/backends/advanced/src/advanced_omi_backend/workers/obsidian_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/obsidian_jobs.py
index 1956f00b..8c67616d 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/obsidian_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/obsidian_jobs.py
@@ -34,7 +34,7 @@ async def ingest_obsidian_vault_job(job_id: str, vault_path: str, redis_client=N
     logger.info("Starting Obsidian ingestion job %s", job.id)
 
     # Initialize job meta
-    job.meta["status"] = "processing"
+    job.meta["status"] = "started"
     job.meta["processed"] = 0
     job.meta["total_files"] = 0
     job.meta["errors"] = []
@@ -74,10 +74,10 @@ async def ingest_obsidian_vault_job(job_id: str, vault_path: str, redis_client=N
             # Check for cancellation
             job.refresh()
             if job.get_status() == "canceled":
-                logger.info("Obsidian ingestion job %s cancelled by user", job.id)
-                job.meta["status"] = "cancelled"
+                logger.info("Obsidian ingestion job %s canceled by user", job.id)
+                job.meta["status"] = "canceled"
                 job.save_meta()
-                return {"status": "cancelled"}
+                return {"status": "canceled"}
 
             try:
                 note_data = obsidian_service.parse_obsidian_note(root, filename, vault_path)
@@ -96,12 +96,12 @@ async def ingest_obsidian_vault_job(job_id: str, vault_path: str, redis_client=N
                 job.meta["errors"] = errors
                 job.save_meta()
 
-    job.meta["status"] = "completed"
+    job.meta["status"] = "finished"
     job.save_meta()
-    
+
     return {
-        "status": "completed", 
-        "processed": processed, 
-        "total": total, 
+        "status": "finished",
+        "processed": processed,
+        "total": total,
         "errors": errors
     }
diff --git a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
index 70935e1a..f492c910 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
@@ -612,7 +612,7 @@ async def stream_speech_detection_job(
 
         # Check if session has closed
         session_status = await redis_client.hget(session_key, "status")
-        session_closed = session_status and session_status.decode() in ["complete", "closed"]
+        session_closed = session_status and session_status.decode() in ["finalizing", "finished"]
 
         if session_closed and session_closed_at is None:
             # Session just closed - start grace period for final transcription
diff --git a/backends/advanced/upload_files.py b/backends/advanced/upload_files.py
index ead58e74..77a001f3 100755
--- a/backends/advanced/upload_files.py
+++ b/backends/advanced/upload_files.py
@@ -321,14 +321,14 @@ def poll_job_status(job_id: str, token: str, base_url: str, total_files: int) ->
                 last_progress = progress
                 last_current_file = current_file
             
-            # Check completion status
-            if status == "completed":
+            # Check completion status (RQ standard: "finished")
+            if status == "finished":
                 elapsed = time.time() - start_time
                 logger.info(f"🎉 Job completed successfully in {elapsed:.0f}s!")
-                
+
                 # Show final file status summary
                 files = job_status.get("files", [])
-                completed = len([f for f in files if f.get("status") == "completed"])
+                completed = len([f for f in files if f.get("status") == "finished"])
                 failed = len([f for f in files if f.get("status") == "failed"])
                 skipped = len([f for f in files if f.get("status") == "skipped"])
                 
diff --git a/backends/advanced/webui/src/pages/Queue.tsx b/backends/advanced/webui/src/pages/Queue.tsx
index 05b56fb6..b05f9374 100644
--- a/backends/advanced/webui/src/pages/Queue.tsx
+++ b/backends/advanced/webui/src/pages/Queue.tsx
@@ -27,10 +27,10 @@ import { queueApi } from '../services/api';
 interface QueueStats {
   total_jobs: number;
   queued_jobs: number;
-  processing_jobs: number;
-  completed_jobs: number;
+  started_jobs: number;  // RQ standard, not "processing_jobs"
+  finished_jobs: number;  // RQ standard, not "completed_jobs"
   failed_jobs: number;
-  cancelled_jobs: number;
+  canceled_jobs: number;  // RQ standard (US spelling), not "cancelled_jobs"
   deferred_jobs: number;
   timestamp: string;
 }
@@ -131,10 +131,10 @@ const Queue: React.FC = () => {
   const [showFlushModal, setShowFlushModal] = useState(false);
   const [flushSettings, setFlushSettings] = useState({
     older_than_hours: 24,
-    statuses: ['completed', 'failed'],
+    statuses: ['finished', 'failed'],  // RQ standard status names
     flush_all: false,
     include_failed: false,  // For flush_all mode
-    include_completed: false  // For flush_all mode
+    include_completed: false  // For flush_all mode (note: API expects include_completed for backward compat)
   });
   const [flushing, setFlushing] = useState(false);
   const [expandedConversations, setExpandedConversations] = useState<Set<string>>(new Set());
@@ -186,19 +186,19 @@ const Queue: React.FC = () => {
       const response = await queueApi.getDashboard(expandedConversationIds);
       const dashboardData = response.data;
 
-      // Extract jobs from response
+      // Extract jobs from response (using RQ standard status names)
       const queuedJobs = dashboardData.jobs.queued || [];
-      const processingJobs = dashboardData.jobs.processing || [];
-      const completedJobs = dashboardData.jobs.completed || [];
+      const startedJobs = dashboardData.jobs.started || [];  // RQ standard, not "processing"
+      const finishedJobs = dashboardData.jobs.finished || [];  // RQ standard, not "completed"
       const failedJobs = dashboardData.jobs.failed || [];
 
       // Combine all jobs
-      const allFetchedJobs = [...queuedJobs, ...processingJobs, ...completedJobs, ...failedJobs];
+      const allFetchedJobs = [...queuedJobs, ...startedJobs, ...finishedJobs, ...failedJobs];
 
       console.log(`📊 Fetched ${allFetchedJobs.length} total jobs via consolidated endpoint`);
       console.log(`  - Queued: ${queuedJobs.length}`);
-      console.log(`  - Processing: ${processingJobs.length}`);
-      console.log(`  - Completed: ${completedJobs.length}`);
+      console.log(`  - Started: ${startedJobs.length}`);  // RQ standard
+      console.log(`  - Finished: ${finishedJobs.length}`);  // RQ standard
       console.log(`  - Failed: ${failedJobs.length}`);
 
       // Debug: Log open_conversation_job details
@@ -266,7 +266,7 @@ const Queue: React.FC = () => {
       // Find all conversations with active open_conversation_job
       Object.entries(jobsByConversation).forEach(([_conversationId, jobs]) => {
         const openConvJob = jobs.find((j: any) => j.job_type === 'open_conversation_job');
-        if (openConvJob && openConvJob.status === 'processing') {
+        if (openConvJob && openConvJob.status === 'started') {
           const conversationId = openConvJob.meta?.conversation_id;
           if (conversationId && !expandedConversations.has(conversationId)) {
             newExpanded.add(conversationId);
@@ -441,12 +441,12 @@ const Queue: React.FC = () => {
   const getStatusIcon = (status: string) => {
     switch (status) {
       case 'queued': return <Clock className="w-4 h-4" />;
-      case 'processing': return <Play className="w-4 h-4 animate-pulse" />;
-      case 'completed': return <CheckCircle className="w-4 h-4" />;
+      case 'started': return <Play className="w-4 h-4 animate-pulse" />;  // RQ standard
+      case 'finished': return <CheckCircle className="w-4 h-4" />;  // RQ standard
       case 'failed': return <XCircle className="w-4 h-4" />;
-      case 'cancelled': return <StopCircle className="w-4 h-4" />;
+      case 'canceled': return <StopCircle className="w-4 h-4" />;  // RQ standard (US spelling)
       case 'deferred': return <Pause className="w-4 h-4" />;
-      case 'waiting': return <Pause className="w-4 h-4" />;
+      case 'scheduled': return <Pause className="w-4 h-4" />;  // RQ standard, not "waiting"
       default: return <Clock className="w-4 h-4" />;
     }
   };
@@ -454,12 +454,12 @@ const Queue: React.FC = () => {
   const getStatusColor = (status: string) => {
     switch (status) {
       case 'queued': return 'text-yellow-600 bg-yellow-100';
-      case 'processing': return 'text-blue-600 bg-blue-100';
-      case 'completed': return 'text-green-600 bg-green-100';
+      case 'started': return 'text-blue-600 bg-blue-100';  // RQ standard
+      case 'finished': return 'text-green-600 bg-green-100';  // RQ standard
       case 'failed': return 'text-red-600 bg-red-100';
-      case 'cancelled': return 'text-gray-600 bg-gray-100';
+      case 'canceled': return 'text-gray-600 bg-gray-100';  // RQ standard (US spelling)
       case 'deferred': return 'text-blue-600 bg-blue-100';
-      case 'waiting': return 'text-blue-600 bg-blue-100';
+      case 'scheduled': return 'text-blue-600 bg-blue-100';  // RQ standard, not "waiting"
       default: return 'text-gray-600 bg-gray-100';
     }
   };
@@ -536,7 +536,7 @@ const Queue: React.FC = () => {
       borderColor = 'border-red-600';
     }
     // Processing jobs - add pulse animation
-    else if (status === 'processing') {
+    else if (status === 'started') {
       bgColor = bgColor + ' animate-pulse';
     }
 
@@ -634,7 +634,7 @@ const Queue: React.FC = () => {
     // For failed/finished jobs, use completed_at or ended_at. For running jobs, use current time.
     const end = job.completed_at || job.ended_at
       ? new Date((job.completed_at || job.ended_at)!).getTime()
-      : (job.status === 'processing' ? Date.now() : start); // Don't show increasing time for failed jobs
+      : (job.status === 'started' ? Date.now() : start); // Don't show increasing time for failed jobs
     const durationMs = end - start;
 
     if (durationMs < 1000) return `${durationMs}ms`;
@@ -758,10 +758,10 @@ const Queue: React.FC = () => {
 
           <div className="bg-white rounded-lg border p-4">
             <div className="flex items-center space-x-2">
-              <Play className={`w-5 h-5 text-blue-600 ${stats.processing_jobs > 0 ? 'animate-pulse' : ''}`} />
+              <Play className={`w-5 h-5 text-blue-600 ${stats.started_jobs > 0 ? 'animate-pulse' : ''}`} />
               <div>
-                <p className="text-sm text-gray-600">Processing</p>
-                <p className="text-xl font-semibold text-blue-600">{stats.processing_jobs}</p>
+                <p className="text-sm text-gray-600">Started</p>
+                <p className="text-xl font-semibold text-blue-600">{stats.started_jobs}</p>
               </div>
             </div>
           </div>
@@ -770,8 +770,8 @@ const Queue: React.FC = () => {
             <div className="flex items-center space-x-2">
               <CheckCircle className="w-5 h-5 text-green-600" />
               <div>
-                <p className="text-sm text-gray-600">Completed</p>
-                <p className="text-xl font-semibold text-green-600">{stats.completed_jobs}</p>
+                <p className="text-sm text-gray-600">Finished</p>
+                <p className="text-xl font-semibold text-green-600">{stats.finished_jobs}</p>
               </div>
             </div>
           </div>
@@ -790,8 +790,8 @@ const Queue: React.FC = () => {
             <div className="flex items-center space-x-2">
               <StopCircle className="w-5 h-5 text-gray-600" />
               <div>
-                <p className="text-sm text-gray-600">Cancelled</p>
-                <p className="text-xl font-semibold text-gray-600">{stats.cancelled_jobs}</p>
+                <p className="text-sm text-gray-600">Canceled</p>
+                <p className="text-xl font-semibold text-gray-600">{stats.canceled_jobs}</p>
               </div>
             </div>
           </div>
@@ -890,7 +890,7 @@ const Queue: React.FC = () => {
                   const allListenJobs = allJobs.filter((job: any) =>
                     job && job.job_type === 'stream_speech_detection_job' &&
                     job.meta?.client_id === clientId &&
-                    job.status !== 'completed' &&
+                    job.status !== 'finished' &&
                     job.status !== 'failed'
                   );
 
@@ -1092,7 +1092,7 @@ const Queue: React.FC = () => {
                   // Filter to only show conversations where at least one job is NOT completed
                   const conversationMap = new Map<string, any[]>();
                   allConversationJobs.forEach((jobs, conversationId) => {
-                    const hasActiveJob = jobs.some(j => j.status !== 'completed' && j.status !== 'failed');
+                    const hasActiveJob = jobs.some(j => j.status !== 'finished' && j.status !== 'failed');
                     if (hasActiveJob) {
                       conversationMap.set(conversationId, jobs);
                     }
@@ -1211,7 +1211,7 @@ const Queue: React.FC = () => {
                                       const startTime = new Date(job.started_at!).getTime();
                                       const endTime = job.completed_at || job.ended_at
                                         ? new Date((job.completed_at || job.ended_at)!).getTime()
-                                        : (job.status === 'processing' ? Date.now() : startTime);
+                                        : (job.status === 'started' ? Date.now() : startTime);
 
                                       return {
                                         job,
@@ -1299,7 +1299,7 @@ const Queue: React.FC = () => {
                                               <div className="flex-1 relative h-6 bg-gray-100 rounded">
                                                 {/* Job Bar */}
                                                 <div
-                                                  className={`absolute h-6 rounded ${barColor} ${job.status === 'processing' ? 'animate-pulse' : ''} flex items-center justify-center`}
+                                                  className={`absolute h-6 rounded ${barColor} ${job.status === 'started' ? 'animate-pulse' : ''} flex items-center justify-center`}
                                                   style={{
                                                     left: `${startPercent}%`,
                                                     width: `${widthPercent}%`
@@ -1533,7 +1533,7 @@ const Queue: React.FC = () => {
                   // Filter to only show conversations where ALL jobs are completed or failed
                   const conversationMap = new Map<string, any[]>();
                   allConversationJobs.forEach((jobs, conversationId) => {
-                    const allJobsComplete = jobs.every(j => j.status === 'completed' || j.status === 'failed');
+                    const allJobsComplete = jobs.every(j => j.status === 'finished' || j.status === 'failed');
                     if (allJobsComplete) {
                       conversationMap.set(conversationId, jobs);
                     }
@@ -1604,7 +1604,7 @@ const Queue: React.FC = () => {
                         const summary = transcriptionMeta.summary || null;
 
                         // Check job statuses
-                        const allComplete = jobs.every(j => j.status === 'completed');
+                        const allComplete = jobs.every(j => j.status === 'finished');
                         const hasFailedJob = jobs.some(j => j.status === 'failed');
                         const failedJobCount = jobs.filter(j => j.status === 'failed').length;
 
@@ -1730,7 +1730,7 @@ const Queue: React.FC = () => {
                                         const startTime = new Date(job.started_at!).getTime();
                                         const endTime = job.completed_at || job.ended_at
                                           ? new Date((job.completed_at || job.ended_at)!).getTime()
-                                          : (job.status === 'processing' ? Date.now() : startTime);
+                                          : (job.status === 'started' ? Date.now() : startTime);
 
                                         return {
                                           job,
@@ -1818,7 +1818,7 @@ const Queue: React.FC = () => {
                                                 <div className="flex-1 relative h-6 bg-gray-100 rounded">
                                                   {/* Job Bar */}
                                                   <div
-                                                    className={`absolute h-6 rounded ${barColor} ${job.status === 'processing' ? 'animate-pulse' : ''} flex items-center justify-center`}
+                                                    className={`absolute h-6 rounded ${barColor} ${job.status === 'started' ? 'animate-pulse' : ''} flex items-center justify-center`}
                                                     style={{
                                                       left: `${startPercent}%`,
                                                       width: `${widthPercent}%`
@@ -2034,10 +2034,10 @@ const Queue: React.FC = () => {
             >
               <option value="">All Statuses</option>
               <option value="queued">Queued</option>
-              <option value="processing">Processing</option>
-              <option value="completed">Completed</option>
+              <option value="started">Started</option>
+              <option value="finished">Finished</option>
               <option value="failed">Failed</option>
-              <option value="cancelled">Cancelled</option>
+              <option value="canceled">Canceled</option>
               <option value="deferred">Deferred</option>
             </select>
           </div>
@@ -2158,7 +2158,7 @@ const Queue: React.FC = () => {
                       >
                         <Eye className="w-4 h-4" />
                       </button>
-                      {(job.status === 'queued' || job.status === 'processing') && (
+                      {(job.status === 'queued' || job.status === 'started') && (
                         <button
                           onClick={() => cancelJob(job.job_id)}
                           className="text-red-600 hover:text-red-900"
@@ -2167,7 +2167,7 @@ const Queue: React.FC = () => {
                           <StopCircle className="w-4 h-4" />
                         </button>
                       )}
-                      {job.status === 'completed' && (
+                      {job.status === 'finished' && (
                         <button
                           onClick={() => cancelJob(job.job_id)}
                           className="text-gray-400 hover:text-gray-600"
@@ -2500,7 +2500,7 @@ const Queue: React.FC = () => {
                       <div>
                         <label className="block text-xs text-gray-600 mb-1">Job statuses to remove:</label>
                         <div className="space-y-1">
-                          {['completed', 'failed', 'cancelled'].map(status => (
+                          {['finished', 'failed', 'canceled'].map(status => (
                             <label key={status} className="flex items-center space-x-2">
                               <input
                                 type="checkbox"
diff --git a/backends/advanced/webui/src/pages/Upload.tsx b/backends/advanced/webui/src/pages/Upload.tsx
index 7c0e12bf..6c22f4e7 100644
--- a/backends/advanced/webui/src/pages/Upload.tsx
+++ b/backends/advanced/webui/src/pages/Upload.tsx
@@ -193,9 +193,9 @@ export default function Upload() {
         try {
           const res = await obsidianApi.status(obsidianJobId)
           setObsidianStatus(res.data)
-          if (res.data.status === 'completed' || res.data.status === 'failed') {
+          if (res.data.status === 'finished' || res.data.status === 'failed') {
             setObsidianPolling(false)
-            setObsidianMessage(res.data.status === 'completed' ? '✅ Ingestion completed' : `❌ Failed: ${res.data.error || 'unknown error'}`)
+            setObsidianMessage(res.data.status === 'finished' ? '✅ Ingestion completed' : `❌ Failed: ${res.data.error || 'unknown error'}`)
           }
         } catch (err) {
           setObsidianPolling(false)
diff --git a/config/defaults.yml b/config/defaults.yml
index 8398881e..b3f5a8f0 100644
--- a/config/defaults.yml
+++ b/config/defaults.yml
@@ -334,9 +334,9 @@ backend:
 
   # Speech detection thresholds
   speech_detection:
-    min_words: 10              # Minimum words to create conversation
-    min_confidence: 0.7        # Word confidence threshold
-    min_duration: 10.0         # Minimum speech duration in seconds
+    min_words: ${oc.decode:${oc.env:SPEECH_DETECTION_MIN_WORDS,10}}              # Minimum words to create conversation
+    min_confidence: ${oc.decode:${oc.env:SPEECH_DETECTION_MIN_CONFIDENCE,0.7}}        # Word confidence threshold
+    min_duration: ${oc.decode:${oc.env:SPEECH_DETECTION_MIN_DURATION,10.0}}         # Minimum speech duration in seconds
 
   # Conversation stop conditions
   conversation_stop:
diff --git a/tests/Makefile b/tests/Makefile
index f1a52793..feff61a2 100644
--- a/tests/Makefile
+++ b/tests/Makefile
@@ -3,8 +3,8 @@
 
 .PHONY: help all clean \
         containers-start containers-stop containers-restart containers-rebuild \
-        containers-clean containers-status containers-logs \
-        start stop restart rebuild status logs \
+        containers-start-rebuild containers-clean containers-status containers-logs \
+        start stop restart rebuild start-rebuild status logs \
         test test-quick test-slow test-sdk test-all-with-slow-and-sdk clean-all
 
 # Default output directory
@@ -16,11 +16,14 @@ help:
 	@echo "Chronicle Test Targets:"
 	@echo ""
 	@echo "Quick Commands:"
-	@echo "  make test        - Start containers + run all tests (excludes slow/sdk)"
-	@echo "  make test-quick  - Run tests on existing containers"
-	@echo "  make start       - Start test containers"
-	@echo "  make stop        - Stop containers (keep volumes)"
-	@echo "  make status      - Show container status"
+	@echo "  make test          - Start containers + run all tests (excludes slow/sdk)"
+	@echo "  make test-quick    - Run tests on existing containers"
+	@echo "  make start         - Start test containers"
+	@echo "  make stop          - Stop containers (keep volumes)"
+	@echo "  make restart       - Restart containers (for .env changes)"
+	@echo "  make rebuild       - Rebuild images only (doesn't start)"
+	@echo "  make start-rebuild - Stop + rebuild + start (for code changes)"
+	@echo "  make status        - Show container status"
 	@echo ""
 	@echo "Running Tests:"
 	@echo "  make all         - Run all tests (excludes slow/sdk)"
@@ -34,13 +37,14 @@ help:
 	@echo "  make test-all-with-slow-and-sdk   - Run ALL tests including excluded"
 	@echo ""
 	@echo "Container Management:"
-	@echo "  make containers-start    - Start test containers"
-	@echo "  make containers-stop     - Stop containers (keep volumes)"
-	@echo "  make containers-restart  - Restart containers"
-	@echo "  make containers-rebuild  - Rebuild + restart containers"
-	@echo "  make containers-clean    - Save logs + remove everything"
-	@echo "  make containers-status   - Show container health"
-	@echo "  make containers-logs     - View service logs (use SERVICE=name)"
+	@echo "  make containers-start         - Start test containers"
+	@echo "  make containers-stop          - Stop containers (keep volumes)"
+	@echo "  make containers-restart       - Restart containers (config changes)"
+	@echo "  make containers-rebuild       - Rebuild images only"
+	@echo "  make containers-start-rebuild - Stop + rebuild + start (code changes)"
+	@echo "  make containers-clean         - Save logs + remove everything"
+	@echo "  make containers-status        - Show container health"
+	@echo "  make containers-logs          - View service logs (use SERVICE=name)"
 	@echo ""
 	@echo "Utilities:"
 	@echo "  make clean       - Remove test output files"
@@ -51,8 +55,9 @@ help:
 	@echo "  SERVICE          - Service name for logs (default: chronicle-backend-test)"
 	@echo ""
 	@echo "Examples:"
-	@echo "  make test                              # Full workflow"
-	@echo "  make endpoints                         # Only endpoint tests"
+	@echo "  make test                                  # Full workflow"
+	@echo "  make endpoints                             # Only endpoint tests"
+	@echo "  make start-rebuild                         # After code changes"
 	@echo "  make containers-logs SERVICE=workers-test  # View worker logs"
 
 # Run all tests (excludes slow and sdk tests for faster feedback)
@@ -117,10 +122,14 @@ containers-stop:
 containers-restart:
 	@./bin/restart-containers.sh
 
-# Rebuild test containers
+# Rebuild test containers (images only)
 containers-rebuild:
 	@./bin/rebuild-containers.sh
 
+# Stop, rebuild, and start test containers
+containers-start-rebuild:
+	@./bin/start-rebuild-containers.sh
+
 # Clean test containers (ALWAYS saves logs first!)
 containers-clean:
 	@./bin/clean-containers.sh
@@ -141,6 +150,7 @@ start: containers-start
 stop: containers-stop
 restart: containers-restart
 rebuild: containers-rebuild
+start-rebuild: containers-start-rebuild
 status: containers-status
 logs: containers-logs
 
diff --git a/tests/bin/rebuild-containers.sh b/tests/bin/rebuild-containers.sh
index a9b798a6..827e544e 100755
--- a/tests/bin/rebuild-containers.sh
+++ b/tests/bin/rebuild-containers.sh
@@ -1,6 +1,6 @@
 #!/bin/bash
 # tests/bin/rebuild-containers.sh
-# Stop, rebuild, and start containers (for code changes)
+# Rebuild test container images (does not start containers)
 
 set -e
 
@@ -9,40 +9,14 @@ BACKEND_DIR="$SCRIPT_DIR/../../backends/advanced"
 
 cd "$BACKEND_DIR"
 
-echo "🔨 Rebuilding test containers..."
-echo "   This will:"
-echo "   1. Stop containers"
-echo "   2. Rebuild images with latest code"
-echo "   3. Start containers"
+echo "🔨 Rebuilding test container images..."
+echo "   This will only rebuild images, not start containers."
+echo "   Use 'make start' to start containers after rebuild."
 echo ""
 
-# Stop containers
-echo "🛑 Stopping containers..."
-docker compose -f docker-compose-test.yml stop
+# Build images
+echo "🏗️  Building images..."
+docker compose -f docker-compose-test.yml build
 
-# Rebuild and start
-echo "🏗️  Rebuilding images..."
-docker compose -f docker-compose-test.yml up -d --build
-
-# Wait for services
-echo "⏳ Waiting for services to be ready..."
-sleep 5
-
-# Health check
-MAX_RETRIES=30
-RETRY_COUNT=0
-while [ $RETRY_COUNT -lt $MAX_RETRIES ]; do
-    if curl -s http://localhost:8001/health > /dev/null 2>&1; then
-        echo "✅ Backend is healthy"
-        break
-    fi
-    RETRY_COUNT=$((RETRY_COUNT + 1))
-    if [ $RETRY_COUNT -eq $MAX_RETRIES ]; then
-        echo "❌ Backend health check failed after $MAX_RETRIES attempts"
-        exit 1
-    fi
-    echo "   Waiting for backend... ($RETRY_COUNT/$MAX_RETRIES)"
-    sleep 2
-done
-
-echo "✅ Test containers rebuilt and running"
+echo "✅ Test container images rebuilt successfully"
+echo "   Run 'make start' to start the containers"
diff --git a/tests/bin/save-container-logs.sh b/tests/bin/save-container-logs.sh
index 5e8782a8..14f68be9 100755
--- a/tests/bin/save-container-logs.sh
+++ b/tests/bin/save-container-logs.sh
@@ -13,17 +13,9 @@ mkdir -p "$LOG_DIR"
 
 echo "📝 Saving container logs to logs/$TIMESTAMP/"
 
-# Get project name from .env.test or use default
-ENV_FILE="$SCRIPT_DIR/../setup/.env.test"
-PROJECT_NAME="advanced-backend-test"  # Default
-
-if [ -f "$ENV_FILE" ]; then
-    # Try to read COMPOSE_PROJECT_NAME from .env.test
-    FOUND_NAME=$(grep COMPOSE_PROJECT_NAME "$ENV_FILE" | cut -d= -f2)
-    if [ -n "$FOUND_NAME" ]; then
-        PROJECT_NAME="$FOUND_NAME"
-    fi
-fi
+# Get project name (from docker-compose-test.yml)
+# The project name is set in the compose file as 'backend-test'
+PROJECT_NAME="backend-test"
 
 # Service list (based on docker-compose-test.yml)
 SERVICES="chronicle-backend-test workers-test mongo-test redis-test qdrant-test speaker-service-test"
diff --git a/tests/bin/start-containers.sh b/tests/bin/start-containers.sh
index 75c96577..a2f33602 100755
--- a/tests/bin/start-containers.sh
+++ b/tests/bin/start-containers.sh
@@ -10,8 +10,8 @@ BACKEND_DIR="$TESTS_DIR/../backends/advanced"
 
 cd "$BACKEND_DIR"
 
-# Set COMPOSE_PROJECT_NAME for test containers
-export COMPOSE_PROJECT_NAME="${COMPOSE_PROJECT_NAME:-advanced-backend-test}"
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
 
 echo "🚀 Starting test containers..."
 
diff --git a/tests/bin/start-rebuild-containers.sh b/tests/bin/start-rebuild-containers.sh
new file mode 100755
index 00000000..cc348f0d
--- /dev/null
+++ b/tests/bin/start-rebuild-containers.sh
@@ -0,0 +1,48 @@
+#!/bin/bash
+# tests/bin/start-rebuild-containers.sh
+# Stop, rebuild, and start containers (full sequence for code changes)
+
+set -e
+
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+BACKEND_DIR="$SCRIPT_DIR/../../backends/advanced"
+
+cd "$BACKEND_DIR"
+
+echo "🔨 Rebuilding and starting test containers..."
+echo "   This will:"
+echo "   1. Stop containers"
+echo "   2. Rebuild images with latest code"
+echo "   3. Start containers"
+echo ""
+
+# Stop containers
+echo "🛑 Stopping containers..."
+docker compose -f docker-compose-test.yml stop
+
+# Rebuild and start
+echo "🏗️  Rebuilding images..."
+docker compose -f docker-compose-test.yml up -d --build
+
+# Wait for services
+echo "⏳ Waiting for services to be ready..."
+sleep 5
+
+# Health check
+MAX_RETRIES=30
+RETRY_COUNT=0
+while [ $RETRY_COUNT -lt $MAX_RETRIES ]; do
+    if curl -s http://localhost:8001/health > /dev/null 2>&1; then
+        echo "✅ Backend is healthy"
+        break
+    fi
+    RETRY_COUNT=$((RETRY_COUNT + 1))
+    if [ $RETRY_COUNT -eq $MAX_RETRIES ]; then
+        echo "❌ Backend health check failed after $MAX_RETRIES attempts"
+        exit 1
+    fi
+    echo "   Waiting for backend... ($RETRY_COUNT/$MAX_RETRIES)"
+    sleep 2
+done
+
+echo "✅ Test containers rebuilt and running"
diff --git a/tests/bin/status-containers.sh b/tests/bin/status-containers.sh
index 4ca962cf..89344731 100755
--- a/tests/bin/status-containers.sh
+++ b/tests/bin/status-containers.sh
@@ -7,12 +7,9 @@ set -e
 SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
 ENV_FILE="$SCRIPT_DIR/../setup/.env.test"
 
-# Get project name
-if [ -f "$ENV_FILE" ]; then
-    PROJECT_NAME=$(grep COMPOSE_PROJECT_NAME "$ENV_FILE" | cut -d= -f2 || echo "advanced-backend-test")
-else
-    PROJECT_NAME="advanced-backend-test"
-fi
+# Get project name (from docker-compose-test.yml)
+# The project name is set in the compose file as 'backend-test'
+PROJECT_NAME="backend-test"
 
 echo "📊 Test Container Status"
 echo "━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━"
diff --git a/tests/endpoints/audio_upload_tests.robot b/tests/endpoints/audio_upload_tests.robot
index 090d84c3..7290f150 100644
--- a/tests/endpoints/audio_upload_tests.robot
+++ b/tests/endpoints/audio_upload_tests.robot
@@ -110,7 +110,7 @@ Multiple Audio Files Upload Test
     # Verify summary
     Dictionary Should Contain Key    ${upload_response}    summary
     Should Be Equal As Integers    ${upload_response}[summary][total]    2    msg=Expected 2 files uploaded
-    Should Be Equal As Integers    ${upload_response}[summary][processing]    2    msg=Expected 2 files processing
+    Should Be Equal As Integers    ${upload_response}[summary][started]    2    msg=Expected 2 files started
 
     # Verify both files are in response
     ${files}=    Set Variable    ${upload_response}[files]
@@ -120,8 +120,8 @@ Multiple Audio Files Upload Test
     # Wait for both transcriptions to complete
     FOR    ${file}    IN    @{files}
         ${transcript_job_id}=    Set Variable    ${file}[transcript_job_id]
-        Wait Until Keyword Succeeds    60s    5s    Check Job Status    ${transcript_job_id}    completed
-        Log To Console    ✅ File ${file}[filename] transcription completed
+        Wait Until Keyword Succeeds    60s    5s    Check Job Status    ${transcript_job_id}    finished
+        Log To Console    ✅ File ${file}[filename] transcription finished
     END
 
     Log To Console    ✅ Uploaded and processed ${file_count} audio files
@@ -157,7 +157,7 @@ Invalid File Upload Test
 
     # Verify file was rejected
     Should Be Equal As Integers    ${upload_response}[summary][failed]    1    msg=Expected 1 file to fail
-    Should Be Equal As Integers    ${upload_response}[summary][processing]    0    msg=Expected 0 files processing
+    Should Be Equal As Integers    ${upload_response}[summary][started]    0    msg=Expected 0 files started
 
     # Verify error message mentions WAV files
     ${error_msg}=    Set Variable    ${upload_response}[files][0][error]
@@ -243,5 +243,5 @@ Audio Upload Job Tracking Test
     Should Be True    ${segment_count} > 0    msg=Should have at least one segment
 
     Log To Console    ✅ Job chain verified
-    Log To Console    📝 Transcription: completed
+    Log To Console    📝 Transcription: finished
     Log To Console    💬 Segments: ${segment_count}
diff --git a/tests/endpoints/client_queue_tests.robot b/tests/endpoints/client_queue_tests.robot
index dd8016da..b161b7fa 100644
--- a/tests/endpoints/client_queue_tests.robot
+++ b/tests/endpoints/client_queue_tests.robot
@@ -88,8 +88,8 @@ Get Queue Statistics Test
 
     ${stats}=      Set Variable    ${response.json()}
     Dictionary Should Contain Key    ${stats}    queued_jobs
-    Dictionary Should Contain Key    ${stats}    processing_jobs
-    Dictionary Should Contain Key    ${stats}    completed_jobs
+    Dictionary Should Contain Key    ${stats}    started_jobs
+    Dictionary Should Contain Key    ${stats}    finished_jobs
     Dictionary Should Contain Key    ${stats}    failed_jobs
 
 
diff --git a/tests/endpoints/conversation_tests.robot b/tests/endpoints/conversation_tests.robot
index 9e2583d0..b1a15938 100644
--- a/tests/endpoints/conversation_tests.robot
+++ b/tests/endpoints/conversation_tests.robot
@@ -59,7 +59,7 @@ Reprocess test and get Conversation Versions Test
 
     # Wait for the reprocess job to complete before getting versions
     ${job_id}=    Set Variable    ${reprocess}[job_id]
-    Wait For Job Status    ${job_id}    completed    timeout=120s    interval=5s
+    Wait For Job Status    ${job_id}    finished    timeout=120s    interval=5s
 
     ${conversation}=           Get Conversation By ID       ${conversation_id}
     ${updated_versions}=           Get Conversation Versions     ${conversation_id}
@@ -111,7 +111,7 @@ Reprocess Memory Test
 
     # Wait for job to complete
     ${job_id}=    Set Variable    ${response}[job_id]
-    Wait For Job Status    ${job_id}    completed    timeout=60s    interval=5s
+    Wait For Job Status    ${job_id}    finished    timeout=60s    interval=5s
 
     # Verify new memory version was created
     ${updated_conversation}=    Get Conversation By ID    ${conversation_id}
@@ -171,7 +171,7 @@ Transcript Version activate Test
         ${reprocess}=    Reprocess Transcript     ${conversation_id}
         # Wait for the reprocess job to complete before getting versions
         ${job_id}=    Set Variable    ${reprocess}[job_id]
-        Wait For Job Status    ${job_id}    completed    timeout=120s    interval=5s
+        Wait For Job Status    ${job_id}    finished    timeout=120s    interval=5s
     END
 
     # Get fresh version list after reprocessing
diff --git a/tests/endpoints/health_tests.robot b/tests/endpoints/health_tests.robot
index e8ee45ec..dc734496 100644
--- a/tests/endpoints/health_tests.robot
+++ b/tests/endpoints/health_tests.robot
@@ -151,8 +151,8 @@ Queue Stats Test
     ${stats}=          Set Variable    ${response.json()}
     Dictionary Should Contain Key    ${stats}    total_jobs
     Dictionary Should Contain Key    ${stats}    queued_jobs
-    Dictionary Should Contain Key    ${stats}    processing_jobs
-    Dictionary Should Contain Key    ${stats}    completed_jobs
+    Dictionary Should Contain Key    ${stats}    started_jobs
+    Dictionary Should Contain Key    ${stats}    finished_jobs
     Dictionary Should Contain Key    ${stats}    failed_jobs
     Dictionary Should Contain Key    ${stats}    timestamp
 
diff --git a/tests/endpoints/plugin_tests.robot b/tests/endpoints/plugin_tests.robot
index d496f012..2ba58aa0 100644
--- a/tests/endpoints/plugin_tests.robot
+++ b/tests/endpoints/plugin_tests.robot
@@ -97,13 +97,13 @@ Batch Transcription Should Trigger Batch Event
     [Documentation]    Verify batch transcription conditions transcript.batch event
     [Tags]    audio-upload	requires-api-keys
 
-    # Upload audio file for batch processing
+    # Upload audio file for batch started
     ${result}=    Upload Single Audio File
 
     # Skip test if audio file not available
     Skip If    ${result}[successful] == 0    Test audio file not available
 
-    # Verify processing completed
+    # Verify started finished
     Should Be True    ${result}[successful] > 0
     ...    msg=At least one file should be processed successfully
 
@@ -128,7 +128,7 @@ Streaming Transcription Should Trigger Streaming Event
 
 *** Keywords ***
 Upload Single Audio File
-    [Documentation]    Upload a single test audio file for batch processing
+    [Documentation]    Upload a single test audio file for batch started
 
     # Get test audio file path
     ${test_audio}=    Set Variable    ${CURDIR}/../../extras/test-audios/short-test.wav
@@ -141,7 +141,7 @@ Upload Single Audio File
         RETURN    ${result}
     END
 
-    # Upload file for processing
+    # Upload file for started
     # Note: This requires authenticated session and proper endpoint
     # Implementation depends on your audio upload endpoint
     ${result}=    Create Dictionary    successful=1    message=Upload simulation
diff --git a/tests/endpoints/rq_queue_tests.robot b/tests/endpoints/rq_queue_tests.robot
index a76376f2..f2d6ce7c 100644
--- a/tests/endpoints/rq_queue_tests.robot
+++ b/tests/endpoints/rq_queue_tests.robot
@@ -136,7 +136,7 @@ Test Multiple Jobs Persistence
         END
     END
 
-    # At least some jobs should persist (they may have completed during restart)
+    # At least some jobs should persist (they may have finished during restart)
     Should Be True    ${persisted_count} >= 0
     Log    ${persisted_count} out of ${job_count} jobs persisted through restart
 
@@ -161,25 +161,25 @@ Test Queue Stats Accuracy
 
     # Verify stats API returns valid structure
     ${stats}=    Get Queue Stats
-    Dictionary Should Contain Key    ${stats}    processing_jobs
+    Dictionary Should Contain Key    ${stats}    started_jobs
     Dictionary Should Contain Key    ${stats}    queued_jobs
-    Dictionary Should Contain Key    ${stats}    completed_jobs
+    Dictionary Should Contain Key    ${stats}    finished_jobs
     Dictionary Should Contain Key    ${stats}    failed_jobs
 
     # Verify all stats are non-negative integers
-    Should Be True    ${stats}[processing_jobs] >= 0
+    Should Be True    ${stats}[started_jobs] >= 0
     Should Be True    ${stats}[queued_jobs] >= 0
-    Should Be True    ${stats}[completed_jobs] >= 0
+    Should Be True    ${stats}[finished_jobs] >= 0
     Should Be True    ${stats}[failed_jobs] >= 0
 
     Log    Queue stats API is working correctly: ${stats}
 
     # Wait for OUR specific jobs to complete (don't rely on global counts)
     FOR    ${job_id}    IN    @{created_jobs}
-        Wait For Job Status    ${job_id}    completed    timeout=60s    interval=2s
+        Wait For Job Status    ${job_id}    finished    timeout=60s    interval=2s
     END
 
-    Log    All ${job_count} created jobs completed successfully
+    Log    All ${job_count} created jobs finished successfully
 
 Test Queue API Authentication
     [Documentation]    Test that queue endpoints properly enforce authentication
diff --git a/tests/infrastructure/infra_tests.robot b/tests/infrastructure/infra_tests.robot
index 41a99de8..35cbe967 100644
--- a/tests/infrastructure/infra_tests.robot
+++ b/tests/infrastructure/infra_tests.robot
@@ -102,7 +102,7 @@ Worker Registration Loss Detection Test
     [Documentation]    Test that the system can automatically recover when workers lose Redis registration
     ...
     ...                This test simulates the exact failure scenario experienced:
-    ...                1. Workers are running and processing jobs
+    ...                1. Workers are running and started jobs
     ...                2. Workers lose Redis registration (Redis restart, network issue, etc.)
     ...                3. Health endpoint should detect 0 workers
     ...                4. Workers should still be running in container
@@ -312,7 +312,7 @@ WebSocket Disconnect Conversation End Reason Test
     # Wait for job to complete (should be fast, not 3600s timeout)
     ${conv_jobs}=    Get Jobs By Type And Client    open_conversation    ${device_name}
     ${conv_job}=    Get Most Recent Job    ${conv_jobs}
-    Wait For Job Status    ${conv_job}[job_id]    completed    timeout=60s    interval=2s
+    Wait For Job Status    ${conv_job}[job_id]    finished    timeout=60s    interval=2s
 
     # Wait for end_reason to be saved to database (retry with timeout)
     ${conversation}=    Wait Until Keyword Succeeds    10s    0.5s
diff --git a/tests/integration/conversation_queue.robot b/tests/integration/conversation_queue.robot
index 2716bf75..e0a3b283 100644
--- a/tests/integration/conversation_queue.robot
+++ b/tests/integration/conversation_queue.robot
@@ -77,8 +77,8 @@ Test Reprocess Conversation Job Queue
 
     Log    Created conversation: ${conversation_id}    INFO
 
-    # Wait for initial upload processing to complete (transcription job chain)
-    Log    Waiting for initial conversation processing to complete...    INFO
+    # Wait for initial upload started to complete (transcription job chain)
+    Log    Waiting for initial conversation started to complete...    INFO
     Sleep    10s    # Give time for initial job chain (transcription -> speaker -> memory)
 
     # Get conversation to verify initial state
@@ -96,9 +96,9 @@ Test Reprocess Conversation Job Queue
     ${version_id}=    Set Variable    ${reprocess_data}[version_id]
 
 
-    # Wait for transcription job to complete (Deepgram API + processing takes time in CI)
+    # Wait for transcription job to complete (Deepgram API + started takes time in CI)
     Log    Waiting for transcription job ${job_id} to complete...    INFO
-    Wait For Job Status    ${job_id}    completed    timeout=60s    interval=3s
+    Wait For Job Status    ${job_id}    finished    timeout=60s    interval=3s
 
     # Verify conversation was updated with new transcript version
     ${updated_conversation}=    Get Conversation By ID    ${conversation_id}
diff --git a/tests/integration/integration_test.robot b/tests/integration/integration_test.robot
index e8ef6563..31ebd747 100644
--- a/tests/integration/integration_test.robot
+++ b/tests/integration/integration_test.robot
@@ -22,7 +22,7 @@ Test Setup       Clear Test Databases
 
 *** Test Cases ***
 Full Pipeline Integration Test
-    [Documentation]    Complete end-to-end test of audio processing pipeline
+    [Documentation]    Complete end-to-end test of audio started pipeline
     [Tags]    e2e	requires-api-keys
     [Timeout]          600s
 
@@ -30,10 +30,10 @@ Full Pipeline Integration Test
 
    
     # Phase 4: Audio Processing - Upload and wait for conversation completion
-    Log    Starting audio upload and processing    INFO
+    Log    Starting audio upload and started    INFO
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}    ${TEST_DEVICE_NAME}
 
-    Log    Audio processing completed, conversation created    INFO
+    Log    Audio started finished, conversation created    INFO
     Set Global Variable    ${TEST_CONVERSATION}    ${conversation}
 
     # Phase 5: Transcription Verification
@@ -60,8 +60,8 @@ Audio Playback And Segment Timing Test
 
     Log    Conversation created: ${conversation_id}    INFO
 
-    # Wait for post-processing jobs to complete
-    Sleep    10s    Wait for post-processing jobs
+    # Wait for post-started jobs to complete
+    Sleep    10s    Wait for post-started jobs
 
     # Refresh conversation data
     ${conversation}=    Get Conversation By ID    ${conversation_id}
@@ -116,15 +116,15 @@ Audio Playback And Segment Timing Test
 
 End To End Pipeline With Memory Validation Test
     [Documentation]    Complete E2E test with memory extraction and OpenAI quality validation.
-    ...                Provides comprehensive integration testing of the entire audio processing pipeline.
+    ...                Provides comprehensive integration testing of the entire audio started pipeline.
     ...                Separate from other tests to avoid breaking existing upload-only tests.
     [Tags]    e2e	memory
     [Timeout]    600s
 
     Log    Starting End-to-End Pipeline Test with Memory Validation    INFO
 
-    # Phase 1: Upload audio and wait for complete processing
-    Log    Uploading audio file and waiting for full processing    INFO
+    # Phase 1: Upload audio and wait for complete started
+    Log    Uploading audio file and waiting for full started    INFO
     ${conversation}    ${memories}=    Upload Audio File And Wait For Memory
     ...    ${TEST_AUDIO_FILE}
     ...    ${TEST_DEVICE_NAME}
@@ -196,7 +196,7 @@ Verify Memory Extraction
 
     Log    Verifying memory extraction    INFO
 
-    # Check if conversation has memory count (may still be processing)
+    # Check if conversation has memory count (may still be started)
     ${has_memory_count}=    Run Keyword And Return Status    Dictionary Should Contain Key    ${conversation}    memory_count
     ${memory_count}=    Run Keyword If    ${has_memory_count}
     ...    Set Variable    ${conversation}[memory_count]
@@ -212,11 +212,11 @@ Verify Memory Extraction
 
     ${api_memory_count}=    Get Length    ${memories}
 
-    # Verify memory extraction status (allow for memory processing to be in progress)
+    # Verify memory extraction status (allow for memory started to be in progress)
     Should Be True    ${memory_count} >= 0    Memory count is negative
     Should Be True    ${api_memory_count} >= 0    API memory count is negative
 
-    Log    Memory extraction verification passed (may still be processing)    INFO
+    Log    Memory extraction verification passed (may still be started)    INFO
     Log    Conversation memory count: ${memory_count}, API memory count: ${api_memory_count}    INFO
 
 Verify Chat Integration
@@ -252,6 +252,6 @@ Verify Chat Integration
     ${response}=    DELETE On Session    ${session_alias}    /api/chat/sessions/${session_id}    expected_status=any
     Should Be True    ${response.status_code} in [200, 204]    Chat session deletion failed with status ${response.status_code}
 
-    Log    Chat integration verification completed    INFO
+    Log    Chat integration verification finished    INFO
 
 
diff --git a/tests/integration/sdk_tests.robot b/tests/integration/sdk_tests.robot
index 1bbe5b6f..047047b3 100644
--- a/tests/integration/sdk_tests.robot
+++ b/tests/integration/sdk_tests.robot
@@ -44,7 +44,7 @@ SDK Can Upload Audio File
     ...    ${CURDIR}/../scripts/sdk_test_upload.py
     ...    ${BACKEND_URL}    ${ADMIN_EMAIL}    ${ADMIN_PASSWORD}    ${test_audio}
     Should Be Equal As Integers    ${result.rc}    0    SDK upload should succeed
-    Should Contain    ${result.stdout}    STATUS:processing    File should be in processing status
+    Should Contain    ${result.stdout}    STATUS:started    File should be in started status
 
 SDK Can Retrieve Conversations
     [Documentation]    Test SDK conversation retrieval
diff --git a/tests/integration/websocket_streaming_tests.robot b/tests/integration/websocket_streaming_tests.robot
index baa357fa..18dbcaa5 100644
--- a/tests/integration/websocket_streaming_tests.robot
+++ b/tests/integration/websocket_streaming_tests.robot
@@ -72,7 +72,7 @@ Conversation Job Created After Speech Detection
     Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200    realtime_pacing=True
 
     # Wait for open_conversation job to be created (transcription + speech analysis takes time)
-    # Deepgram/OpenAI API calls + job processing can take 30-60s with queue
+    # Deepgram/OpenAI API calls + job started can take 30-60s with queue
     Wait Until Keyword Succeeds    60s    3s
     ...    Job Type Exists For Client    open_conversation    ${client_id}
 
@@ -137,10 +137,10 @@ Conversation Closes On Inactivity Timeout And Restarts Speech Detection
     # The conversation should auto-close after SPEECH_INACTIVITY_THRESHOLD_SECONDS
     Log To Console    Waiting for inactivity timeout to trigger conversation close...
 
-    # Wait for conversation job to complete (status changes from 'started' to 'completed')
+    # Wait for conversation job to complete (status changes from 'started' to 'finished')
     # Timeout value should be > SPEECH_INACTIVITY_THRESHOLD_SECONDS + buffer
-    Wait For Job Status    ${conv_job_id}    completed    timeout=30s    interval=2s
-    Log To Console    Conversation job completed (timeout triggered)
+    Wait For Job Status    ${conv_job_id}    finished    timeout=30s    interval=2s
+    Log To Console    Conversation job finished (timeout triggered)
 
     # Verify a NEW speech detection job (2nd one) was created for next conversation
     # The handle_end_of_conversation function creates a new speech_detection job
@@ -152,7 +152,7 @@ Conversation Closes On Inactivity Timeout And Restarts Speech Detection
     Log To Console    New speech detection job created for next conversation
 
     # Verify post-conversation jobs were enqueued (linked by conversation_id, not client_id)
-    # These jobs process the completed conversation: speaker recognition, memory, title
+    # These jobs process the finished conversation: speaker recognition, memory, title
     # Note: Streaming conversations no longer have batch transcription - transcript comes from streaming
     Log To Console    Verifying post-conversation jobs (speaker, memory, title)...
 
diff --git a/tests/integration/websocket_transcription_e2e_test.robot b/tests/integration/websocket_transcription_e2e_test.robot
index a555a22d..d45cec26 100644
--- a/tests/integration/websocket_transcription_e2e_test.robot
+++ b/tests/integration/websocket_transcription_e2e_test.robot
@@ -95,7 +95,7 @@ Speech Detection Receives Transcription From Stream
     ${job_id}=    Set Variable    ${speech_job}[job_id]
 
     # Wait for job to complete
-    Wait For Job Status    ${job_id}    completed    timeout=60s    interval=2s
+    Wait For Job Status    ${job_id}    finished    timeout=60s    interval=2s
 
     # Get job result
     ${result}=    Get Job Result    ${job_id}
@@ -133,8 +133,8 @@ Conversation Created With Valid Transcript
 
     Should Not Be Empty    ${conversation_id}    Conversation ID not found in open_conversation job metadata
 
-    # Wait for conversation to complete processing (inactivity timeout)
-    Wait For Job Status    ${conv_job}[job_id]    completed    timeout=60s    interval=2s
+    # Wait for conversation to complete started (inactivity timeout)
+    Wait For Job Status    ${conv_job}[job_id]    finished    timeout=60s    interval=2s
 
     # Retrieve the conversation
     ${conversation}=    Get Conversation By ID    ${conversation_id}
@@ -177,31 +177,16 @@ Stream Close Sends End Marker To Redis Stream
     Sleep    2s
 
     # Read all messages from audio stream to find end_marker
-    ${messages}=    Redis Command    XRANGE    ${audio_stream_name}    -    +
-
-    # Search for end_marker in messages
-    ${found_end_marker}=    Set Variable    ${False}
-    FOR    ${message}    IN    @{messages}
-        # Message format: [message_id, [field1, value1, field2, value2, ...]]
-        ${fields}=    Set Variable    ${message}[1]
-
-        # Check if 'end_marker' field exists
-        ${field_count}=    Get Length    ${fields}
-        FOR    ${index}    IN RANGE    0    ${field_count}    2
-            ${field_name}=    Set Variable    ${fields}[${index}]
-            IF    '${field_name}' == 'end_marker' or b'end_marker' in str($field_name)
-                ${found_end_marker}=    Set Variable    ${True}
-                Log    Found end_marker in audio stream at message ${message}[0]
-                BREAK
-            END
-        END
-
-        IF    ${found_end_marker}
-            BREAK
-        END
-    END
-
-    Should Be True    ${found_end_marker}    end_marker NOT found in Redis stream ${audio_stream_name}! Producer.finalize_session() did not send end_marker.
+    # Note: Redis Command returns string output from redis-cli, not a list
+    ${xrange_output}=    Redis Command    XRANGE    ${audio_stream_name}    -    +
+
+    # Search for end_marker in the redis-cli output string
+    # redis-cli XRANGE returns text with field names, so we just check if end_marker appears
+    ${found_end_marker}=    Run Keyword And Return Status
+    ...    Should Contain    ${xrange_output}    end_marker
+    ...    ignore_case=True
+
+    Should Be True    ${found_end_marker}    end_marker NOT found in Redis stream ${audio_stream_name}! Producer.finalize_session() did not send end_marker. XRANGE output: ${xrange_output}
 
     Log    ✅ end_marker successfully sent to Redis stream
 
diff --git a/tests/resources/audio_keywords.robot b/tests/resources/audio_keywords.robot
index d194c0c3..2baf48e9 100644
--- a/tests/resources/audio_keywords.robot
+++ b/tests/resources/audio_keywords.robot
@@ -44,8 +44,8 @@ Upload Audio File
       Log    Parsed upload response: ${upload_response}
 
       # Validate upload was successful
-      Should Be Equal As Strings    ${upload_response['summary']['processing']}    1    Upload failed: No files enqueued
-      Should Be Equal As Strings    ${upload_response['files'][0]['status']}    processing    Upload failed: ${response.text}
+      Should Be Equal As Strings    ${upload_response['summary']['started']}    1    Upload failed: No files enqueued
+      Should Be Equal As Strings    ${upload_response['files'][0]['status']}    started    Upload failed: ${response.text}
 
       # Extract important values
       ${job_id}=        Set Variable    ${upload_response['files'][0]['conversation_id']}
@@ -56,19 +56,19 @@ Upload Audio File
       # Wait for conversation to be created and transcribed
       Log    Waiting for transcription to complete...
 
-      Wait Until Keyword Succeeds    60s    5s       Check job status   ${transcript_job_id}    completed
+      Wait Until Keyword Succeeds    60s    5s       Check job status   ${transcript_job_id}    finished
       ${job}=    Get Job Details    ${transcript_job_id}
 
-     # Get the completed conversation
+     # Get the finished conversation
       ${conversation}=     Get Conversation By ID    ${job}[result][conversation_id]
-      Should Not Be Equal    ${conversation}    ${None}    Conversation not found after upload and processing
+      Should Not Be Equal    ${conversation}    ${None}    Conversation not found after upload and started
 
       Log    Found conversation: ${conversation}
       RETURN    ${conversation}
 
 
 Upload Audio File And Wait For Memory
-    [Documentation]    Upload audio file and wait for complete processing including memory extraction.
+    [Documentation]    Upload audio file and wait for complete started including memory extraction.
     ...                This is for E2E testing - use Upload Audio File for upload-only tests.
     ...                Performs assertions inline to verify successful memory extraction.
     [Arguments]    ${audio_file_path}    ${device_name}=robot-test    ${folder}=.    ${min_memories}=1
@@ -96,9 +96,9 @@ Upload Audio File And Wait For Memory
     Should Be True    ${result}[success]
     ...    Memory extraction failed: ${result.get('error_message', 'Unknown error')}
 
-    # Verify job completed successfully
-    Should Be Equal As Strings    ${result}[status]    completed
-    ...    Expected job status 'completed', got '${result}[status]'
+    # Verify job finished successfully
+    Should Be Equal As Strings    ${result}[status]    finished
+    ...    Expected job status 'finished', got '${result}[status]'
 
     # Verify minimum memories were extracted
     ${memory_count}=    Set Variable    ${result}[memory_count]
diff --git a/tests/resources/conversation_keywords.robot b/tests/resources/conversation_keywords.robot
index 50d7bd92..26d80739 100644
--- a/tests/resources/conversation_keywords.robot
+++ b/tests/resources/conversation_keywords.robot
@@ -48,7 +48,7 @@ Reprocess Transcript
     ${initial_status}=    Set Variable    ${reprocess_data}[status]
 
     Log    Reprocess job created: ${job_id} with status: ${initial_status}    INFO
-    Should Be True    '${initial_status}' in ['queued', 'processing']    Status should be 'queued' or 'processing', got: ${initial_status}
+    Should Be True    '${initial_status}' in ['queued', 'started']    Status should be 'queued' or 'started', got: ${initial_status}
 
     RETURN    ${response.json()}
 
@@ -123,7 +123,7 @@ Update Transcript Segment
 
 
 Create Test Conversation
-    [Documentation]    Create a test conversation by processing a test audio file
+    [Documentation]    Create a test conversation by started a test audio file
     [Arguments]     ${device_name}=test-device
 
     # Upload test audio file to create a conversation
@@ -154,7 +154,7 @@ Find Test Conversation
     Log    No conversations found, creating one by uploading test audio
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}    ${TEST_DEVICE_NAME}
 
-    # Wait for initial processing to complete
+    # Wait for initial started to complete
     Sleep    5s
 
     RETURN    ${conversation}
diff --git a/tests/resources/memory_keywords.robot b/tests/resources/memory_keywords.robot
index 2ab79d9c..a18cc7cf 100644
--- a/tests/resources/memory_keywords.robot
+++ b/tests/resources/memory_keywords.robot
@@ -115,7 +115,7 @@ Wait For Memory Extraction
     ...                {
     ...                  'success': True/False,
     ...                  'error_message': 'Error description' (only if success=False),
-    ...                  'status': 'completed'/'failed'/'timeout'/'not_found',
+    ...                  'status': 'finished'/'failed'/'timeout'/'not_found',
     ...                  'job': {job object} (if available),
     ...                  'memories': [list of memories] (if successful),
     ...                  'memory_count': int (if successful)
@@ -170,9 +170,9 @@ Wait For Memory Extraction
         ${final_job}=    Set Variable    ${job}
         ${final_status}=    Set Variable    ${status}
 
-        # Success case - job completed
-        IF    '${status}' == 'completed' or '${status}' == 'finished'
-            Log    Memory job completed successfully
+        # Success case - job finished
+        IF    '${status}' == 'finished' or '${status}' == 'finished'
+            Log    Memory job finished successfully
             BREAK
         END
 
@@ -181,7 +181,7 @@ Wait For Memory Extraction
             ${error_info}=    Evaluate    $job.get('exc_info', 'Unknown error')
             ${result}=    Create Dictionary
             ...    success=${False}
-            ...    error_message=Memory job failed during processing: ${error_info}
+            ...    error_message=Memory job failed during started: ${error_info}
             ...    status=failed
             ...    job=${job}
             RETURN    ${result}
@@ -215,7 +215,7 @@ Wait For Memory Extraction
         # Return success result
         ${result}=    Create Dictionary
         ...    success=${True}
-        ...    status=completed
+        ...    status=finished
         ...    job=${final_job}
         ...    memories=${memories}
         ...    memory_count=${memory_count}
diff --git a/tests/resources/queue_keywords.robot b/tests/resources/queue_keywords.robot
index 80856883..dac88e17 100644
--- a/tests/resources/queue_keywords.robot
+++ b/tests/resources/queue_keywords.robot
@@ -59,7 +59,7 @@ Get Job Status
 
 Check job status
     [Documentation]    Check the status of a specific job by ID
-    ...                Fails immediately if job is in 'failed' state when expecting 'completed'
+    ...                Fails immediately if job is in 'failed' state when expecting 'finished'
     [Arguments]    ${job_id}    ${expected_status}
 
     ${job}=    Get Job status    ${job_id}
@@ -70,8 +70,8 @@ Check job status
     ${actual_status}=    Set Variable    ${job}[status]
     Log    Job ${job_id} status: ${actual_status} (expected: ${expected_status})
 
-    # Fail fast if job is in failed state when we're expecting completed
-    IF    '${actual_status}' == 'failed' and '${expected_status}' == 'completed'
+    # Fail fast if job is in failed state when we're expecting finished
+    IF    '${actual_status}' == 'failed' and '${expected_status}' == 'finished'
         ${error_msg}=    Evaluate    $job.get('error_message') or $job.get('exc_info') or $job.get('error', 'Unknown error')
         Fail    Job ${job_id} failed: ${error_msg}
     END
@@ -249,12 +249,13 @@ Cancel All Running Jobs
     END
 
 Flush In Progress Jobs
-    [Documentation]    Flush only queued and in-progress jobs (preserves completed/failed jobs)
-    ...                Use in test cleanup to reset queue state without losing job history
+    [Documentation]    Flush queued, in-progress, and finished jobs (preserves only failed jobs for debugging)
+    ...                Use in test cleanup to reset queue state between tests
+    ...                Includes finished jobs to prevent test contamination from previous runs
 
     Log To Console    Flushing in-progress and queued jobs...
     TRY
-        ${payload}=    Create Dictionary    confirm=${True}
+        ${payload}=    Create Dictionary    confirm=${True}    include_finished=${True}
         ${response}=    POST On Session    api    /api/queue/flush-all    json=${payload}    expected_status=200
         ${result}=    Set Variable    ${response.json()}
         Log To Console    Successfully flushed ${result}[total_removed] jobs
@@ -319,16 +320,16 @@ Get Conversation ID From Job Meta
     RETURN    ${conversation_id}
 
 Job Should Be Complete
-    [Documentation]    Check if job has reached a completed state (completed, finished, or failed)
+    [Documentation]    Check if job has reached a terminal state (finished or failed)
     [Arguments]    ${job_id}
 
     ${job}=    Get Job status    ${job_id}
     ${status}=    Set Variable    ${job}[status]
-    Should Be True    '${status}' in ['completed', 'finished', 'failed']    Job status: ${status}
+    Should Be True    '${status}' in ['finished', 'failed']    Job status: ${status}
 
 
 Get Job Result
-    [Documentation]    Get the result field of a completed job
+    [Documentation]    Get the result field of a finished job
     ...                Useful for checking job output/return values
     [Arguments]    ${job_id}
 
diff --git a/tests/resources/websocket_keywords.robot b/tests/resources/websocket_keywords.robot
index 1db7a212..51dd6f03 100644
--- a/tests/resources/websocket_keywords.robot
+++ b/tests/resources/websocket_keywords.robot
@@ -138,7 +138,7 @@ Cleanup All Audio Streams
 
 Stream And Wait For Conversation
     [Documentation]    Send audio chunks to stream, wait for conversation to be created and closed.
-    ...                Returns the conversation_id of the completed conversation.
+    ...                Returns the conversation_id of the finished conversation.
     ...                Works correctly even with existing conversations by tracking new conversation creation.
     [Arguments]    ${stream_id}    ${audio_file_path}    ${device_name}    ${num_chunks}=100
 
@@ -169,7 +169,7 @@ Stream And Wait For Conversation
     Log    New conversation created: ${conversation_id}
 
     # Wait for conversation to close via inactivity timeout (with queue drain, can take 45+ seconds)
-    Wait For Job Status    ${new_job}[job_id]    completed    timeout=60s    interval=2s
+    Wait For Job Status    ${new_job}[job_id]    finished    timeout=60s    interval=2s
     Log    Conversation closed: ${conversation_id}
 
     RETURN    ${conversation_id}
diff --git a/tests/run-no-api-tests.sh b/tests/run-no-api-tests.sh
index bb8cb8a9..98ae3241 100755
--- a/tests/run-no-api-tests.sh
+++ b/tests/run-no-api-tests.sh
@@ -72,9 +72,6 @@ if [ ! -f "setup/.env.test" ]; then
     print_info "Creating test environment file..."
     mkdir -p setup
 
-    # Set COMPOSE_PROJECT_NAME with fallback
-    COMPOSE_PROJECT_NAME_VALUE="${COMPOSE_PROJECT_NAME:-advanced-backend-test}"
-
     cat > setup/.env.test << EOF
 # API URLs
 API_URL=http://localhost:8001
@@ -89,11 +86,11 @@ ADMIN_PASSWORD=test-admin-password-123
 TEST_TIMEOUT=120
 TEST_DEVICE_NAME=robot-test
 
-# Docker Compose Project Name
-COMPOSE_PROJECT_NAME=${COMPOSE_PROJECT_NAME_VALUE}
-
 # Note: No API keys required for this test mode
 # OPENAI_API_KEY and DEEPGRAM_API_KEY are not needed
+
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# COMPOSE_PROJECT_NAME is no longer needed
 EOF
     print_success "Created setup/.env.test"
 fi
diff --git a/tests/run-robot-tests.sh b/tests/run-robot-tests.sh
index 4c25fab2..40fabded 100755
--- a/tests/run-robot-tests.sh
+++ b/tests/run-robot-tests.sh
@@ -122,9 +122,6 @@ if [ ! -f "setup/.env.test" ]; then
     print_info "Creating test environment file..."
     mkdir -p setup
 
-    # Set COMPOSE_PROJECT_NAME with fallback
-    COMPOSE_PROJECT_NAME_VALUE="${COMPOSE_PROJECT_NAME:-advanced-backend-test}"
-
     cat > setup/.env.test << EOF
 # API URLs
 API_URL=http://localhost:8001
@@ -143,8 +140,8 @@ DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY}
 TEST_TIMEOUT=120
 TEST_DEVICE_NAME=robot-test
 
-# Docker Compose Project Name
-COMPOSE_PROJECT_NAME=${COMPOSE_PROJECT_NAME_VALUE}
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# COMPOSE_PROJECT_NAME is no longer needed
 EOF
     print_success "Created setup/.env.test"
 fi
diff --git a/tests/setup-test-containers.sh b/tests/setup-test-containers.sh
index 951db21c..8e12b84b 100755
--- a/tests/setup-test-containers.sh
+++ b/tests/setup-test-containers.sh
@@ -20,10 +20,10 @@ print_error() { echo -e "${RED}[ERROR]${NC} $1"; }
 SCRIPT_DIR="$(dirname "$0")"
 cd "$SCRIPT_DIR/../backends/advanced" || exit 1
 
-# Set default COMPOSE_PROJECT_NAME (can be overridden by .env.test)
-export COMPOSE_PROJECT_NAME="${COMPOSE_PROJECT_NAME:-advanced-backend-test}"
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
 
-# Load environment variables for tests (may override COMPOSE_PROJECT_NAME)
+# Load environment variables for tests
 if [ -f "$SCRIPT_DIR/setup/.env.test" ]; then
     print_info "Loading test environment..."
     set -a
@@ -53,10 +53,9 @@ if [ "$FRESH_BUILD" = "false" ]; then
     fi
 fi
 
-# Clean up any existing test containers from ANY project name to avoid port conflicts
+# Clean up any existing test containers to avoid port conflicts
 print_info "Cleaning up any existing test containers..."
 docker compose -f docker-compose-test.yml down 2>/dev/null || true
-COMPOSE_PROJECT_NAME=advanced docker compose -f docker-compose-test.yml down 2>/dev/null || true
 
 # Remove any stale "Created" containers that might be holding ports
 docker ps -a --filter "name=backend-test" --filter "status=created" --format "{{.Names}}" | xargs -r docker rm -f 2>/dev/null || true
diff --git a/tests/setup/test_manager_keywords.robot b/tests/setup/test_manager_keywords.robot
index a1935dc4..d306fa78 100644
--- a/tests/setup/test_manager_keywords.robot
+++ b/tests/setup/test_manager_keywords.robot
@@ -80,8 +80,8 @@ Clear Test Databases
     # Don't delete plugin database files - database is cleared via Clear Plugin Events keyword
     # Run Process    bash    -c    docker exec ${BACKEND_CONTAINER} find /app/debug_dir -name "*" -type f -delete || true    shell=True
 
-    # Clear Redis queues and job registries (preserve worker registrations, failed and completed jobs)
-    # Delete all rq:* keys except worker registrations (rq:worker:*), failed jobs (rq:failed:*), and completed jobs (rq:finished:*)
+    # Clear Redis queues and job registries (preserve worker registrations, failed and finished jobs)
+    # Delete all rq:* keys except worker registrations (rq:worker:*), failed jobs (rq:failed:*), and finished jobs (rq:finished:*)
     ${redis_clear_script}=    Set Variable    redis-cli --scan --pattern "rq:*" | grep -Ev "^rq:(worker|failed|finished)" | xargs -r redis-cli DEL; redis-cli --scan --pattern "audio:*" | xargs -r redis-cli DEL; redis-cli --scan --pattern "consumer:*" | xargs -r redis-cli DEL
     Run Process    docker    exec    ${REDIS_CONTAINER}    sh    -c    ${redis_clear_script}    shell=True
     Log To Console    Redis queues and job registries cleared (worker registrations preserved)
diff --git a/tests/teardown-test-containers.sh b/tests/teardown-test-containers.sh
index d335e40e..b1c38438 100755
--- a/tests/teardown-test-containers.sh
+++ b/tests/teardown-test-containers.sh
@@ -19,10 +19,10 @@ print_warning() { echo -e "${YELLOW}[WARNING]${NC} $1"; }
 SCRIPT_DIR="$(dirname "$0")"
 cd "$SCRIPT_DIR/../backends/advanced" || exit 1
 
-# Set default COMPOSE_PROJECT_NAME (can be overridden by .env.test)
-export COMPOSE_PROJECT_NAME="${COMPOSE_PROJECT_NAME:-advanced-backend-test}"
+# Note: Project name 'backend-test' is set in docker-compose-test.yml
+# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
 
-# Load .env.test if available to get consistent project name
+# Load .env.test if available for other environment variables
 if [ -f "$SCRIPT_DIR/setup/.env.test" ]; then
     set -a
     source "$SCRIPT_DIR/setup/.env.test"

From 8b4d78385c95da5c6706af2ed60b7f9f47287088 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Mon, 19 Jan 2026 18:29:46 +0000
Subject: [PATCH 02/14] Update test configurations and improve audio inactivity
 handling

- Increased `SPEECH_INACTIVITY_THRESHOLD_SECONDS` to 20 seconds in `docker-compose-test.yml` for better audio duration handling during tests.
- Refactored session handling in `session_controller.py` to clarify client ID usage.
- Updated `conversation_utils.py` to track speech activity using audio timestamps, enhancing accuracy in inactivity detection.
- Simplified test scripts by removing unnecessary `COMPOSE_PROJECT_NAME` references, aligning with the new project naming convention.
- Adjusted integration tests to reflect changes in inactivity timeout and ensure proper handling of audio timestamps.
---
 backends/advanced/docker-compose-test.yml     | 10 +++---
 .../controllers/session_controller.py         |  5 +--
 .../routers/modules/annotation_routes.py      |  4 +--
 .../utils/conversation_utils.py               | 34 +++++++++++++++----
 .../workers/conversation_jobs.py              | 21 +++++++++---
 tests/.env.test                               |  5 +--
 tests/bin/start-containers.sh                 |  3 --
 tests/endpoints/rq_queue_tests.robot          |  6 ++--
 tests/infrastructure/infra_tests.robot        |  3 +-
 .../websocket_streaming_tests.robot           | 13 +++----
 tests/run-no-api-tests.sh                     |  3 --
 tests/run-robot-tests.sh                      |  3 --
 tests/setup-test-containers.sh                |  3 --
 tests/setup/test_env.py                       | 16 ++++-----
 tests/teardown-test-containers.sh             |  3 --
 15 files changed, 73 insertions(+), 59 deletions(-)

diff --git a/backends/advanced/docker-compose-test.yml b/backends/advanced/docker-compose-test.yml
index e89102f5..c6df21f4 100644
--- a/backends/advanced/docker-compose-test.yml
+++ b/backends/advanced/docker-compose-test.yml
@@ -47,8 +47,9 @@ services:
       # Speaker recognition controlled by config.yml (disabled in test config for CI performance)
       - SPEAKER_SERVICE_URL=http://speaker-service-test:8085
       - CORS_ORIGINS=http://localhost:3001,http://localhost:8001,https://localhost:3001,https://localhost:8001
-      # Set low inactivity timeout for tests (2 seconds instead of 60)
-      - SPEECH_INACTIVITY_THRESHOLD_SECONDS=2
+      # Set inactivity timeout for tests (20 seconds of audio time)
+      # This is audio duration, not wall-clock time
+      - SPEECH_INACTIVITY_THRESHOLD_SECONDS=20
       # Set low speech detection thresholds for tests
       - SPEECH_DETECTION_MIN_DURATION=2.0  # 2 seconds instead of 10
       - SPEECH_DETECTION_MIN_WORDS=5  # 5 words instead of 10
@@ -194,8 +195,9 @@ services:
       - MYCELIA_DB=mycelia_test
       # Speaker recognition controlled by config.yml (disabled in test config for CI performance)
       - SPEAKER_SERVICE_URL=http://speaker-service-test:8085
-      # Set low inactivity timeout for tests (2 seconds instead of 60)
-      - SPEECH_INACTIVITY_THRESHOLD_SECONDS=2
+      # Set inactivity timeout for tests (20 seconds of audio time)
+      # This is audio duration, not wall-clock time
+      - SPEECH_INACTIVITY_THRESHOLD_SECONDS=20
       # Set low speech detection thresholds for tests
       - SPEECH_DETECTION_MIN_DURATION=2.0  # 2 seconds instead of 10
       - SPEECH_DETECTION_MIN_WORDS=5  # 5 words instead of 10
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
index 165bb4c3..2e12e3e1 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
@@ -199,7 +199,7 @@ async def get_streaming_status(request):
         transcription_queue,
         memory_queue,
         default_queue,
-        all_jobs_complete_for_session
+        all_jobs_complete_for_client
     )
 
     try:
@@ -229,7 +229,8 @@ async def get_streaming_status(request):
 
             # Separate active and completed sessions
             # Check if all jobs are complete (including failed jobs)
-            all_jobs_done = all_jobs_complete_for_session(session_id)
+            # Note: session_id == client_id in streaming context, but using client_id explicitly
+            all_jobs_done = all_jobs_complete_for_client(session_obj.get("client_id"))
 
             # Session is finished if:
             # 1. Redis status says finished AND all jobs done, OR
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/annotation_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/annotation_routes.py
index dc2bbd3f..e8d36d1e 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/annotation_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/annotation_routes.py
@@ -124,7 +124,7 @@ async def create_transcript_annotation(
             raise HTTPException(status_code=404, detail="Conversation not found")
 
         # Validate segment index
-        active_transcript = conversation.get_active_transcript()
+        active_transcript = conversation.active_transcript
         if (
             not active_transcript
             or annotation_data.segment_index >= len(active_transcript.segments)
@@ -288,7 +288,7 @@ async def update_annotation_status(
                         Conversation.user_id == annotation.user_id
                     )
                     if conversation:
-                        transcript = conversation.get_active_transcript()
+                        transcript = conversation.active_transcript
                         if (
                             transcript
                             and annotation.segment_index < len(transcript.segments)
diff --git a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
index c0f92408..03f75dc3 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
@@ -438,23 +438,46 @@ async def track_speech_activity(
     speech_analysis: Dict[str, Any], last_word_count: int, conversation_id: str, redis_client
 ) -> tuple[float, int]:
     """
-    Track new speech activity and update last speech timestamp.
+    Track new speech activity and update last speech timestamp using audio timestamps.
 
-    Uses word count instead of chunk count to avoid false positives from noise/silence.
+    Uses word count to detect new speech, and audio timestamps (speech_end) to track
+    when the last speech occurred in the audio stream (not wall-clock time).
 
     Args:
-        speech_analysis: Speech analysis results from analyze_speech()
+        speech_analysis: Speech analysis results from analyze_speech() with:
+            - word_count: Number of words detected
+            - speech_end: Audio timestamp of last word (if available)
+            - fallback: True if using text-only analysis without timing
         last_word_count: Previous word count
         conversation_id: Conversation ID for Redis key
         redis_client: Redis client instance
 
     Returns:
         Tuple of (last_meaningful_speech_time, new_word_count)
+        Note: last_meaningful_speech_time is audio timestamp, NOT wall-clock time
     """
     current_word_count = speech_analysis.get("word_count", 0)
 
     if current_word_count > last_word_count:
-        last_meaningful_speech_time = time.time()
+        # Use audio timestamp (speech_end) when available
+        speech_end = speech_analysis.get("speech_end")
+        is_fallback = speech_analysis.get("fallback", False)
+
+        if speech_end is not None and speech_end > 0:
+            # Preferred: Use audio timestamp from word-level timing
+            last_meaningful_speech_time = speech_end
+            logger.debug(
+                f"🗣️ New speech detected (word count: {current_word_count}), "
+                f"audio timestamp: {speech_end:.2f}s"
+            )
+        else:
+            # Fallback: Use wall-clock time when word-level timing unavailable
+            # This happens with text-only transcription or missing timing data
+            last_meaningful_speech_time = time.time()
+            logger.warning(
+                f"⚠️ Using wall-clock time for speech tracking (no audio timestamps available). "
+                f"Word count: {current_word_count}, fallback={is_fallback}"
+            )
 
         # Store timestamp in Redis for visibility/debugging
         await redis_client.set(
@@ -462,9 +485,6 @@ async def track_speech_activity(
             last_meaningful_speech_time,
             ex=86400,  # 24 hour TTL
         )
-        logger.debug(
-            f"🗣️ New speech detected (word count: {current_word_count}), updated last_speech timestamp"
-        )
 
         return last_meaningful_speech_time, current_word_count
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index 8edc01e4..d0650f75 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -289,9 +289,9 @@ async def open_conversation_job(
     # Inactivity timeout configuration
     inactivity_timeout_seconds = float(os.getenv("SPEECH_INACTIVITY_THRESHOLD_SECONDS", "60"))
     inactivity_timeout_minutes = inactivity_timeout_seconds / 60
-    last_meaningful_speech_time = time.time()  # Initialize with conversation start
+    last_meaningful_speech_time = 0.0  # Initialize with audio time 0 (will be updated with first speech)
     timeout_triggered = False  # Track if closure was due to timeout
-    last_inactivity_log_time = time.time()  # Track when we last logged inactivity
+    last_inactivity_log_time = time.time()  # Track when we last logged inactivity (wall-clock for logging)
     last_word_count = 0  # Track word count to detect actual new speech
 
     # Test mode: wait for audio queue to drain before timing out
@@ -407,8 +407,21 @@ async def open_conversation_job(
             last_meaningful_speech_time=last_meaningful_speech_time,
         )
 
-        # Check inactivity timeout and log every 10 seconds
-        inactivity_duration = time.time() - last_meaningful_speech_time
+        # Check inactivity timeout using audio time (not wall-clock time)
+        # Get current audio time from latest transcription
+        current_audio_time = speech_analysis.get("speech_end", 0.0)
+
+        # Calculate inactivity based on audio timestamps
+        # Only check if we have valid audio timing data
+        if current_audio_time > 0 and last_meaningful_speech_time > 0:
+            inactivity_duration = current_audio_time - last_meaningful_speech_time
+        else:
+            # Fallback: No audio timestamps available (text-only transcription)
+            # Can't reliably detect inactivity, so skip timeout check this iteration
+            inactivity_duration = 0
+            if speech_analysis.get("fallback", False):
+                logger.debug("⚠️ Skipping inactivity check (no audio timestamps available)")
+
         current_time = time.time()
 
         # Log inactivity every 10 seconds
diff --git a/tests/.env.test b/tests/.env.test
index 652e028e..b26c757c 100644
--- a/tests/.env.test
+++ b/tests/.env.test
@@ -17,7 +17,4 @@ MEMORY_PROVIDER=chronicle
 
 # MongoDB Configuration (test environment)
 MONGODB_URI=mongodb://localhost:27018
-TEST_DB_NAME=test_db
-
-# Docker Compose Project Name (used by test_env.py to generate container names)
-COMPOSE_PROJECT_NAME=advanced-backend-test
\ No newline at end of file
+TEST_DB_NAME=test_db
\ No newline at end of file
diff --git a/tests/bin/start-containers.sh b/tests/bin/start-containers.sh
index a2f33602..b3fed506 100755
--- a/tests/bin/start-containers.sh
+++ b/tests/bin/start-containers.sh
@@ -10,9 +10,6 @@ BACKEND_DIR="$TESTS_DIR/../backends/advanced"
 
 cd "$BACKEND_DIR"
 
-# Note: Project name 'backend-test' is set in docker-compose-test.yml
-# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
-
 echo "🚀 Starting test containers..."
 
 # Check if .env.test exists, create from template if needed
diff --git a/tests/endpoints/rq_queue_tests.robot b/tests/endpoints/rq_queue_tests.robot
index f2d6ce7c..cbd58d96 100644
--- a/tests/endpoints/rq_queue_tests.robot
+++ b/tests/endpoints/rq_queue_tests.robot
@@ -28,12 +28,10 @@ Restart Backend Service
     [Documentation]    Restart the backend service to test persistence
     Log    Restarting backend service to test job persistence
 
-    # Get COMPOSE_PROJECT_NAME from environment
-    ${project_name}=    Get Environment Variable    COMPOSE_PROJECT_NAME    default=advanced-backend-test
-
     # Restart backend container (handles dependencies properly)
+    # Project name 'backend-test' is set in docker-compose-test.yml
     Run Process    docker    compose    -f    ${COMPOSE_FILE}    restart    chronicle-backend-test
-    ...    cwd=${BACKEND_DIR}    timeout=60s    shell=True    env:COMPOSE_PROJECT_NAME=${project_name}
+    ...    cwd=${BACKEND_DIR}    timeout=60s    shell=True
 
     # Wait for backend to be ready again (configurable timeout for slow tests)
     Wait Until Keyword Succeeds    ${wait_timeout}    5s
diff --git a/tests/infrastructure/infra_tests.robot b/tests/infrastructure/infra_tests.robot
index 35cbe967..59ac95c1 100644
--- a/tests/infrastructure/infra_tests.robot
+++ b/tests/infrastructure/infra_tests.robot
@@ -26,8 +26,7 @@ Suite Setup      Suite Setup
 Suite Teardown   Suite Teardown
 Test Setup       Test Cleanup
 *** Variables ***
-# Container names are now dynamically loaded from test_env.py based on COMPOSE_PROJECT_NAME
-# This allows tests to work with different docker-compose project names
+# Container names are loaded from test_env.py (hardcoded to match docker-compose-test.yml project name)
 
 *** Keywords ***
 
diff --git a/tests/integration/websocket_streaming_tests.robot b/tests/integration/websocket_streaming_tests.robot
index 18dbcaa5..63baadf8 100644
--- a/tests/integration/websocket_streaming_tests.robot
+++ b/tests/integration/websocket_streaming_tests.robot
@@ -103,21 +103,22 @@ Conversation Job Created After Speech Detection
 
 
 Conversation Closes On Inactivity Timeout And Restarts Speech Detection
-    [Documentation]    Verify that after SPEECH_INACTIVITY_THRESHOLD_SECONDS of silence,
+    [Documentation]    Verify that after SPEECH_INACTIVITY_THRESHOLD_SECONDS of silence (audio time),
     ...                the open_conversation job closes with timeout_triggered=True,
     ...                a new speech_detection job is created for the next conversation,
     ...                and post-conversation jobs are enqueued (speaker, memory, title).
     ...                Note: Streaming conversations use streaming transcript (no batch transcription).
     ...
-    ...                Test environment sets SPEECH_INACTIVITY_THRESHOLD_SECONDS=5 in docker-compose-test.yml.
-    [Tags]    audio-streaming	queue	conversation
+    ...                Test environment sets SPEECH_INACTIVITY_THRESHOLD_SECONDS=20 in docker-compose-test.yml.
+    [Tags]    audio-streaming	queue	conversation	slow
 
     ${device_name}=    Set Variable    test-post
     ${client_id}=    Get Client ID From Device Name    ${device_name}
 
     # Open stream and send enough audio to trigger speech detection and conversation
     ${stream_id}=    Open Audio Stream    device_name=${device_name}
-    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
+    # Use realtime pacing so Deepgram can finalize transcription segments as audio streams in
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200    realtime_pacing=True
 
     # Wait for conversation job to be created (transcription + speech analysis takes time)
     ${conv_jobs}=    Wait Until Keyword Succeeds    60s    3s
@@ -138,8 +139,8 @@ Conversation Closes On Inactivity Timeout And Restarts Speech Detection
     Log To Console    Waiting for inactivity timeout to trigger conversation close...
 
     # Wait for conversation job to complete (status changes from 'started' to 'finished')
-    # Timeout value should be > SPEECH_INACTIVITY_THRESHOLD_SECONDS + buffer
-    Wait For Job Status    ${conv_job_id}    finished    timeout=30s    interval=2s
+    # Timeout needs: (audio send time ~60s) + (silence timeout 20s) + (buffer 10s) = 90s
+    Wait For Job Status    ${conv_job_id}    finished    timeout=90s    interval=2s
     Log To Console    Conversation job finished (timeout triggered)
 
     # Verify a NEW speech detection job (2nd one) was created for next conversation
diff --git a/tests/run-no-api-tests.sh b/tests/run-no-api-tests.sh
index 98ae3241..25d04f97 100755
--- a/tests/run-no-api-tests.sh
+++ b/tests/run-no-api-tests.sh
@@ -88,9 +88,6 @@ TEST_DEVICE_NAME=robot-test
 
 # Note: No API keys required for this test mode
 # OPENAI_API_KEY and DEEPGRAM_API_KEY are not needed
-
-# Note: Project name 'backend-test' is set in docker-compose-test.yml
-# COMPOSE_PROJECT_NAME is no longer needed
 EOF
     print_success "Created setup/.env.test"
 fi
diff --git a/tests/run-robot-tests.sh b/tests/run-robot-tests.sh
index 40fabded..015b63e0 100755
--- a/tests/run-robot-tests.sh
+++ b/tests/run-robot-tests.sh
@@ -139,9 +139,6 @@ DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY}
 # Test Configuration
 TEST_TIMEOUT=120
 TEST_DEVICE_NAME=robot-test
-
-# Note: Project name 'backend-test' is set in docker-compose-test.yml
-# COMPOSE_PROJECT_NAME is no longer needed
 EOF
     print_success "Created setup/.env.test"
 fi
diff --git a/tests/setup-test-containers.sh b/tests/setup-test-containers.sh
index 8e12b84b..8ff3ff45 100755
--- a/tests/setup-test-containers.sh
+++ b/tests/setup-test-containers.sh
@@ -20,9 +20,6 @@ print_error() { echo -e "${RED}[ERROR]${NC} $1"; }
 SCRIPT_DIR="$(dirname "$0")"
 cd "$SCRIPT_DIR/../backends/advanced" || exit 1
 
-# Note: Project name 'backend-test' is set in docker-compose-test.yml
-# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
-
 # Load environment variables for tests
 if [ -f "$SCRIPT_DIR/setup/.env.test" ]; then
     print_info "Loading test environment..."
diff --git a/tests/setup/test_env.py b/tests/setup/test_env.py
index a7cdc363..924d0592 100644
--- a/tests/setup/test_env.py
+++ b/tests/setup/test_env.py
@@ -81,12 +81,10 @@
     "default_timeout": 30
 }
 
-# Docker Container Names (dynamically based on COMPOSE_PROJECT_NAME)
-# Default to 'advanced' if not set (which is the directory name)
-COMPOSE_PROJECT_NAME = os.getenv('COMPOSE_PROJECT_NAME', 'advanced')
-BACKEND_CONTAINER = f"{COMPOSE_PROJECT_NAME}-chronicle-backend-test-1"
-WORKERS_CONTAINER = f"{COMPOSE_PROJECT_NAME}-workers-test-1"
-MONGO_CONTAINER = f"{COMPOSE_PROJECT_NAME}-mongo-test-1"
-REDIS_CONTAINER = f"{COMPOSE_PROJECT_NAME}-redis-test-1"
-QDRANT_CONTAINER = f"{COMPOSE_PROJECT_NAME}-qdrant-test-1"
-WEBUI_CONTAINER = f"{COMPOSE_PROJECT_NAME}-webui-test-1"
+# Docker Container Names (based on docker-compose-test.yml project name: backend-test)
+BACKEND_CONTAINER = "backend-test-chronicle-backend-test-1"
+WORKERS_CONTAINER = "backend-test-workers-test-1"
+MONGO_CONTAINER = "backend-test-mongo-test-1"
+REDIS_CONTAINER = "backend-test-redis-test-1"
+QDRANT_CONTAINER = "backend-test-qdrant-test-1"
+WEBUI_CONTAINER = "backend-test-webui-test-1"
diff --git a/tests/teardown-test-containers.sh b/tests/teardown-test-containers.sh
index b1c38438..9a86e7f7 100755
--- a/tests/teardown-test-containers.sh
+++ b/tests/teardown-test-containers.sh
@@ -19,9 +19,6 @@ print_warning() { echo -e "${YELLOW}[WARNING]${NC} $1"; }
 SCRIPT_DIR="$(dirname "$0")"
 cd "$SCRIPT_DIR/../backends/advanced" || exit 1
 
-# Note: Project name 'backend-test' is set in docker-compose-test.yml
-# No need to export COMPOSE_PROJECT_NAME - it's handled by the compose file
-
 # Load .env.test if available for other environment variables
 if [ -f "$SCRIPT_DIR/setup/.env.test" ]; then
     set -a

From 42eb911d41ca42b04a90b8a34181653edc8bfad6 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Tue, 20 Jan 2026 05:59:19 +0000
Subject: [PATCH 03/14] Refactor audio processing and enhance error handling

- Updated `worker_orchestrator.py` to use `logger.exception` for improved error logging.
- Changed default MongoDB database name from "friend-lite" to "chronicle" in multiple files for consistency.
- Added a new method `close_stream_without_stop` in `audio_stream_client.py` to handle abrupt WebSocket disconnections.
- Enhanced audio validation in `audio_utils.py` to support automatic resampling of audio data if sample rates do not match.
- Improved logging in various modules to provide clearer insights during audio processing and event dispatching.
---
 .../src/advanced_omi_backend/app_config.py    |   3 +-
 .../clients/audio_stream_client.py            |  33 +++++
 .../controllers/audio_controller.py           |   3 +-
 .../controllers/queue_controller.py           |   1 +
 .../controllers/session_controller.py         |   5 +-
 .../controllers/websocket_controller.py       |  20 ++-
 .../src/advanced_omi_backend/database.py      |   2 +-
 .../middleware/app_middleware.py              |   1 +
 .../src/advanced_omi_backend/models/job.py    |   2 +-
 .../advanced_omi_backend/plugins/router.py    |  33 ++++-
 .../plugins/test_event/event_storage.py       |  56 ++++++--
 .../plugins/test_event/plugin.py              |  37 +++--
 .../services/audio_stream/producer.py         |  16 ++-
 .../advanced_omi_backend/utils/audio_utils.py | 118 +++++++++++++--
 .../workers/conversation_jobs.py              | 136 +++++++++++-------
 .../workers/memory_jobs.py                    |   9 ++
 .../workers/speaker_jobs.py                   |  31 +++-
 .../workers/transcription_jobs.py             |  12 +-
 backends/advanced/worker_orchestrator.py      |   6 +-
 .../api/routers/identification.py             |  14 +-
 .../tests/test_speaker_service_integration.py | 112 +++++++++++++--
 tests/infrastructure/infra_tests.robot        |  59 ++++++--
 .../audio_streaming_integration_tests.robot   |   6 +-
 tests/integration/plugin_event_tests.robot    |   6 +-
 tests/libs/audio_stream_library.py            |   9 ++
 tests/resources/queue_keywords.robot          |   2 +-
 tests/resources/websocket_keywords.robot      |  11 ++
 27 files changed, 601 insertions(+), 142 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/app_config.py b/backends/advanced/src/advanced_omi_backend/app_config.py
index 15e825ec..c87398f3 100644
--- a/backends/advanced/src/advanced_omi_backend/app_config.py
+++ b/backends/advanced/src/advanced_omi_backend/app_config.py
@@ -29,8 +29,7 @@ class AppConfig:
     def __init__(self):
         # MongoDB Configuration
         self.mongodb_uri = os.getenv("MONGODB_URI", "mongodb://mongo:27017")
-        # default to legacy value to avoid breaking peoples .env
-        self.mongodb_database = os.getenv("MONGODB_DATABASE", "friend-lite")
+        self.mongodb_database = os.getenv("MONGODB_DATABASE", "chronicle")
         self.mongo_client = AsyncIOMotorClient(self.mongodb_uri)
         self.db = self.mongo_client.get_default_database(self.mongodb_database)
         self.users_col = self.db["users"]
diff --git a/backends/advanced/src/advanced_omi_backend/clients/audio_stream_client.py b/backends/advanced/src/advanced_omi_backend/clients/audio_stream_client.py
index 07a401a4..ee33b86c 100644
--- a/backends/advanced/src/advanced_omi_backend/clients/audio_stream_client.py
+++ b/backends/advanced/src/advanced_omi_backend/clients/audio_stream_client.py
@@ -555,6 +555,39 @@ async def _stop():
         logger.info(f"Stream {stream_id} stopped, sent {total_chunks} chunks")
         return total_chunks
 
+    def close_stream_without_stop(self, stream_id: str) -> int:
+        """Close WebSocket connection without sending audio-stop event.
+
+        This simulates abrupt disconnection (network failure, client crash)
+        and should trigger websocket_disconnect end_reason.
+
+        Args:
+            stream_id: Stream session ID
+
+        Returns:
+            Total chunks sent during this session
+        """
+        session = self._sessions.get(stream_id)
+        if not session:
+            raise ValueError(f"Unknown stream_id: {stream_id}")
+
+        async def _close_abruptly():
+            # Just close the connection without audio-stop
+            await session.client.close()
+
+        future = asyncio.run_coroutine_threadsafe(_close_abruptly(), session.loop)
+        future.result(timeout=10)
+
+        # Stop the event loop
+        session.loop.call_soon_threadsafe(session.loop.stop)
+        session.thread.join(timeout=5)
+
+        total_chunks = session.chunk_count
+        del self._sessions[stream_id]
+
+        logger.info(f"Stream {stream_id} closed abruptly (no audio-stop), sent {total_chunks} chunks")
+        return total_chunks
+
     def get_session(self, stream_id: str) -> Optional[StreamSession]:
         """Get session info for a stream."""
         return self._sessions.get(stream_id)
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index d726a392..a2321d58 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -94,7 +94,8 @@ async def upload_and_process_audio_files(
                     audio_data, sample_rate, sample_width, channels, duration = await validate_and_prepare_audio(
                         audio_data=content,
                         expected_sample_rate=16000,  # Expecting 16kHz
-                        convert_to_mono=True  # Convert stereo to mono
+                        convert_to_mono=True,  # Convert stereo to mono
+                        auto_resample=True  # Auto-resample if sample rate doesn't match
                     )
                 except AudioValidationError as e:
                     processed_files.append({
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
index d804df95..17a4899d 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
@@ -537,6 +537,7 @@ def start_post_conversation_jobs(
         conversation_id,
         client_id or "",
         user_id,
+        "file_upload",  # Explicit end_reason for file upload processing
         job_timeout=120,  # 2 minutes
         result_ttl=JOB_RESULT_TTL,
         depends_on=[memory_job, title_summary_job],  # Wait for both parallel jobs
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
index 2e12e3e1..fe9b87cd 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/session_controller.py
@@ -56,12 +56,13 @@ async def mark_session_complete(
         await mark_session_complete(redis, session_id, "all_jobs_complete")
     """
     session_key = f"audio:session:{session_id}"
+    mark_time = time.time()
     await redis_client.hset(session_key, mapping={
         "status": "finished",
-        "completed_at": str(time.time()),
+        "completed_at": str(mark_time),
         "completion_reason": reason
     })
-    logger.info(f"✅ Session {session_id[:12]} marked finished: {reason}")
+    logger.info(f"✅ Session {session_id[:12]} marked finished: {reason} [TIME: {mark_time:.3f}]")
 
 
 async def get_session_info(redis_client, session_id: str) -> Optional[Dict]:
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
index 79bb56fc..fa5b23b2 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
@@ -238,6 +238,10 @@ async def cleanup_client_state(client_id: str):
         redis_url = os.getenv("REDIS_URL", "redis://localhost:6379/0")
         async_redis = redis.from_url(redis_url, decode_responses=False)
 
+        # Get audio stream producer for finalization
+        from advanced_omi_backend.services.audio_stream.producer import get_audio_stream_producer
+        audio_stream_producer = get_audio_stream_producer()
+
         # Find all session keys for this client and mark them complete
         pattern = f"audio:session:*"
         cursor = 0
@@ -250,8 +254,18 @@ async def cleanup_client_state(client_id: str):
                 # Check if this session belongs to this client
                 client_id_bytes = await async_redis.hget(key, "client_id")
                 if client_id_bytes and client_id_bytes.decode() == client_id:
-                    # Mark session as complete (WebSocket disconnected)
                     session_id = key.decode().replace("audio:session:", "")
+
+                    # Check session status
+                    status_bytes = await async_redis.hget(key, "status")
+                    status = status_bytes.decode() if status_bytes else None
+
+                    # If session is still active, finalize it first (sets status + completion_reason atomically)
+                    if status in ["active", None]:
+                        logger.info(f"📊 Finalizing active session {session_id[:12]} due to WebSocket disconnect")
+                        await audio_stream_producer.finalize_session(session_id, completion_reason="websocket_disconnect")
+
+                    # Mark session as complete (WebSocket disconnected)
                     await mark_session_complete(async_redis, session_id, "websocket_disconnect")
                     sessions_closed += 1
 
@@ -485,8 +499,8 @@ async def _finalize_streaming_session(
         # Send end-of-session signal to workers
         await audio_stream_producer.send_session_end_signal(session_id)
 
-        # Mark session as finalizing
-        await audio_stream_producer.finalize_session(session_id)
+        # Mark session as finalizing with user_stopped reason (audio-stop event)
+        await audio_stream_producer.finalize_session(session_id, completion_reason="user_stopped")
 
         # NOTE: Finalize job disabled - open_conversation_job now handles everything
         # The open_conversation_job will:
diff --git a/backends/advanced/src/advanced_omi_backend/database.py b/backends/advanced/src/advanced_omi_backend/database.py
index ae7650b0..1b214b6d 100644
--- a/backends/advanced/src/advanced_omi_backend/database.py
+++ b/backends/advanced/src/advanced_omi_backend/database.py
@@ -14,7 +14,7 @@
 
 # MongoDB Configuration
 MONGODB_URI = os.getenv("MONGODB_URI", "mongodb://mongo:27017")
-MONGODB_DATABASE = os.getenv("MONGODB_DATABASE", "friend-lite")
+MONGODB_DATABASE = os.getenv("MONGODB_DATABASE", "chronicle")
 
 mongo_client = AsyncIOMotorClient(
     MONGODB_URI,
diff --git a/backends/advanced/src/advanced_omi_backend/middleware/app_middleware.py b/backends/advanced/src/advanced_omi_backend/middleware/app_middleware.py
index 4cff21eb..069d5239 100644
--- a/backends/advanced/src/advanced_omi_backend/middleware/app_middleware.py
+++ b/backends/advanced/src/advanced_omi_backend/middleware/app_middleware.py
@@ -60,6 +60,7 @@ class RequestLoggingMiddleware(BaseHTTPMiddleware):
         "/health",
         "/auth/health",
         "/readiness",
+        "/api/queue/dashboard",  # Auto-refresh endpoint, too noisy
     }
 
     # Binary content types to exclude
diff --git a/backends/advanced/src/advanced_omi_backend/models/job.py b/backends/advanced/src/advanced_omi_backend/models/job.py
index f2d85add..5d906865 100644
--- a/backends/advanced/src/advanced_omi_backend/models/job.py
+++ b/backends/advanced/src/advanced_omi_backend/models/job.py
@@ -44,7 +44,7 @@ async def _ensure_beanie_initialized():
             mongodb_uri = os.getenv("MONGODB_URI", "mongodb://localhost:27017")
 
             # Create MongoDB client
-            mongodb_database = os.getenv("MONGODB_DATABASE", "friend-lite")
+            mongodb_database = os.getenv("MONGODB_DATABASE", "chronicle")
             client = AsyncIOMotorClient(mongodb_uri)
             try:
                 database = client.get_default_database(mongodb_database)
diff --git a/backends/advanced/src/advanced_omi_backend/plugins/router.py b/backends/advanced/src/advanced_omi_backend/plugins/router.py
index f046520c..523fe3ed 100644
--- a/backends/advanced/src/advanced_omi_backend/plugins/router.py
+++ b/backends/advanced/src/advanced_omi_backend/plugins/router.py
@@ -122,23 +122,37 @@ async def dispatch_event(
         Returns:
             List of plugin results
         """
+        # Add at start
+        logger.info(f"🔌 ROUTER: Dispatching '{event}' event (user={user_id})")
+
         results = []
 
         # Get plugins subscribed to this event
         plugin_ids = self._plugins_by_event.get(event, [])
 
+        # Add subscription check
+        if not plugin_ids:
+            logger.warning(f"🔌 ROUTER: No plugins subscribed to event '{event}'")
+            return results
+
+        logger.info(f"🔌 ROUTER: Found {len(plugin_ids)} subscribed plugin(s): {plugin_ids}")
+
         for plugin_id in plugin_ids:
             plugin = self.plugins[plugin_id]
 
             if not plugin.enabled:
+                logger.info(f"   ⊘ Skipping '{plugin_id}': disabled")
                 continue
 
             # Check execution condition (wake_word, etc.)
+            logger.info(f"   → Checking execution condition for '{plugin_id}'")
             if not await self._should_execute(plugin, data):
+                logger.info(f"   ⊘ Skipping '{plugin_id}': condition not met")
                 continue
 
             # Execute plugin
             try:
+                logger.info(f"   ▶ Executing '{plugin_id}' for event '{event}'")
                 context = PluginContext(
                     user_id=user_id,
                     event=event,
@@ -149,15 +163,30 @@ async def dispatch_event(
                 result = await self._execute_plugin(plugin, event, context)
 
                 if result:
+                    status_icon = "✓" if result.success else "✗"
+                    logger.info(
+                        f"   {status_icon} Plugin '{plugin_id}' completed: "
+                        f"success={result.success}, message={result.message}"
+                    )
                     results.append(result)
 
                     # If plugin says stop processing, break
                     if not result.should_continue:
-                        logger.info(f"Plugin '{plugin_id}' stopped further processing")
+                        logger.info(f"   ⊗ Plugin '{plugin_id}' stopped further processing")
                         break
 
             except Exception as e:
-                logger.error(f"Error executing plugin '{plugin_id}': {e}", exc_info=True)
+                # CRITICAL: Log exception details
+                logger.error(
+                    f"   ✗ Plugin '{plugin_id}' FAILED with exception: {e}",
+                    exc_info=True
+                )
+
+        # Add at end
+        logger.info(
+            f"🔌 ROUTER: Dispatch complete for '{event}': "
+            f"{len(results)} plugin(s) executed successfully"
+        )
 
         return results
 
diff --git a/backends/advanced/src/advanced_omi_backend/plugins/test_event/event_storage.py b/backends/advanced/src/advanced_omi_backend/plugins/test_event/event_storage.py
index 00bc674d..4fb618f9 100644
--- a/backends/advanced/src/advanced_omi_backend/plugins/test_event/event_storage.py
+++ b/backends/advanced/src/advanced_omi_backend/plugins/test_event/event_storage.py
@@ -118,29 +118,55 @@ async def log_event(
         Returns:
             Row ID of inserted event
         """
+        # Add at start
+        logger.debug(f"💾 STORAGE: Logging event '{event}' for user {user_id}")
+
         if not self.db:
+            logger.error("💾 STORAGE: Database connection not initialized!")
             raise RuntimeError("Event storage not initialized")
 
         timestamp = datetime.utcnow().isoformat()
-        data_json = json.dumps(data)
-        metadata_json = json.dumps(metadata) if metadata else None
 
-        cursor = await self.db.execute(
-            """
-            INSERT INTO plugin_events (timestamp, event, user_id, data, metadata)
-            VALUES (?, ?, ?, ?, ?)
-            """,
-            (timestamp, event, user_id, data_json, metadata_json)
-        )
+        # Add before serialization
+        logger.debug(f"💾 STORAGE: Serializing event data...")
+        try:
+            data_json = json.dumps(data)
+            metadata_json = json.dumps(metadata) if metadata else None
+        except Exception as e:
+            logger.error(
+                f"💾 STORAGE: JSON serialization failed for event '{event}': {e}",
+                exc_info=True
+            )
+            raise
 
-        await self.db.commit()
-        row_id = cursor.lastrowid
+        # Add before database operation
+        logger.debug(f"💾 STORAGE: Inserting into plugin_events table...")
 
-        logger.debug(
-            f"Logged event: {event} for user {user_id} (row_id={row_id})"
-        )
+        try:
+            cursor = await self.db.execute(
+                """
+                INSERT INTO plugin_events (timestamp, event, user_id, data, metadata)
+                VALUES (?, ?, ?, ?, ?)
+                """,
+                (timestamp, event, user_id, data_json, metadata_json)
+            )
+
+            await self.db.commit()
+            row_id = cursor.lastrowid
+
+            # Add success log
+            logger.info(
+                f"💾 STORAGE: Event '{event}' inserted successfully (row_id={row_id})"
+            )
+
+            return row_id
 
-        return row_id
+        except Exception as e:
+            logger.error(
+                f"💾 STORAGE: Database operation failed for event '{event}': {e}",
+                exc_info=True
+            )
+            raise
 
     async def get_events_by_type(self, event: str) -> List[Dict[str, Any]]:
         """
diff --git a/backends/advanced/src/advanced_omi_backend/plugins/test_event/plugin.py b/backends/advanced/src/advanced_omi_backend/plugins/test_event/plugin.py
index 6b96e078..59dd652e 100644
--- a/backends/advanced/src/advanced_omi_backend/plugins/test_event/plugin.py
+++ b/backends/advanced/src/advanced_omi_backend/plugins/test_event/plugin.py
@@ -115,11 +115,21 @@ async def on_conversation_complete(self, context: PluginContext) -> Optional[Plu
         Returns:
             PluginResult indicating success
         """
+        conversation_id = context.data.get('conversation_id', 'unknown')
+        duration = context.data.get('duration', 0)
+
+        # Add at start
+        logger.info(
+            f"📝 HANDLER: on_conversation_complete called for {conversation_id[:12]}"
+        )
+        logger.debug(f"   Event: {context.event}")
+        logger.debug(f"   Metadata: {context.metadata}")
+        logger.debug(f"   Duration: {duration}s")
+
         try:
-            conversation_id = context.data.get('conversation_id', 'unknown')
-            duration = context.data.get('duration', 0)
+            # Add before storage
+            logger.info(f"   💾 Storing event to SQLite database...")
 
-            # Log to storage
             row_id = await self.storage.log_event(
                 event=context.event,  # 'conversation.complete'
                 user_id=context.user_id,
@@ -127,27 +137,28 @@ async def on_conversation_complete(self, context: PluginContext) -> Optional[Plu
                 metadata=context.metadata
             )
 
-            self.event_count += 1
+            # Add after storage
+            logger.info(f"   ✓ Event stored successfully (row_id={row_id})")
 
-            logger.info(
-                f"📝 Logged conversation.complete event (row_id={row_id}): "
-                f"user={context.user_id}, "
-                f"conversation={conversation_id}, "
-                f"duration={duration:.2f}s"
-            )
+            self.event_count += 1
 
             return PluginResult(
                 success=True,
                 message=f"Conversation event logged (row_id={row_id})",
-                should_continue=True
+                data={"row_id": row_id},
+                should_continue=True,
             )
 
         except Exception as e:
-            logger.error(f"Error logging conversation event: {e}", exc_info=True)
+            # Enhance error logging
+            logger.error(
+                f"   ✗ Storage FAILED for {conversation_id[:12]}: {e}",
+                exc_info=True
+            )
             return PluginResult(
                 success=False,
                 message=f"Failed to log conversation event: {e}",
-                should_continue=True
+                should_continue=True,
             )
 
     async def on_memory_processed(self, context: PluginContext) -> Optional[PluginResult]:
diff --git a/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py b/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
index 6ec4fad4..224d69f4 100644
--- a/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
+++ b/backends/advanced/src/advanced_omi_backend/services/audio_stream/producer.py
@@ -216,19 +216,29 @@ async def mark_websocket_disconnected(self, session_id: str):
         })
         logger.info(f"🔌 Marked websocket disconnected for session {session_id}")
 
-    async def finalize_session(self, session_id: str):
+    async def finalize_session(self, session_id: str, completion_reason: str = None):
         """
         Mark session as finalizing, send end marker, and clean up buffer.
 
         Args:
             session_id: Session identifier
+            completion_reason: Optional reason for session completion (e.g., "websocket_disconnect", "user_stopped")
+                              This is set atomically with status to avoid race conditions.
         """
         session_key = f"audio:session:{session_id}"
 
-        await self.redis_client.hset(session_key, mapping={
+        # Build mapping with status and optional completion_reason
+        mapping = {
             "status": "finalizing",
             "finalized_at": str(time.time())
-        })
+        }
+
+        # Set completion_reason atomically with status to prevent race conditions
+        if completion_reason:
+            mapping["completion_reason"] = completion_reason
+            logger.info(f"📊 Finalizing session {session_id} with reason: {completion_reason}")
+
+        await self.redis_client.hset(session_key, mapping=mapping)
 
         # Send end_marker to Redis stream so streaming consumer can close the connection
         if session_id in self.session_buffers:
diff --git a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
index ce81bbb8..f8ba07a3 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/audio_utils.py
@@ -3,15 +3,18 @@
 ###############################################################################
 
 import asyncio
+import io
 import logging
 import os
 import time
 import uuid as uuid_lib
+import wave
 from pathlib import Path
 
 # Type import to avoid circular imports
 from typing import TYPE_CHECKING, Optional
 
+import numpy as np
 from wyoming.audio import AudioChunk
 
 if TYPE_CHECKING:
@@ -30,10 +33,85 @@ class AudioValidationError(Exception):
     pass
 
 
+async def resample_audio_with_ffmpeg(
+    audio_data: bytes,
+    input_sample_rate: int,
+    input_channels: int,
+    input_sample_width: int,
+    target_sample_rate: int,
+    target_channels: int = 1
+) -> bytes:
+    """
+    Resample audio using FFmpeg with stdin/stdout pipes (no disk I/O).
+
+    Args:
+        audio_data: Raw PCM audio bytes
+        input_sample_rate: Input sample rate in Hz
+        input_channels: Number of input channels
+        input_sample_width: Input sample width in bytes (2 for 16-bit, 4 for 32-bit)
+        target_sample_rate: Target sample rate in Hz
+        target_channels: Target number of channels (default: 1 for mono)
+
+    Returns:
+        Resampled PCM audio bytes (16-bit signed little-endian)
+
+    Raises:
+        RuntimeError: If FFmpeg resampling fails
+    """
+    # Determine FFmpeg format based on sample width
+    if input_sample_width == 2:
+        input_format = "s16le"  # 16-bit signed little-endian
+    elif input_sample_width == 4:
+        input_format = "s32le"  # 32-bit signed little-endian
+    else:
+        raise AudioValidationError(
+            f"Unsupported sample width: {input_sample_width} bytes (only 2 or 4 supported)"
+        )
+
+    # FFmpeg command for resampling via pipes
+    # pipe:0 = stdin, pipe:1 = stdout
+    cmd = [
+        "ffmpeg",
+        "-f", input_format,
+        "-ar", str(input_sample_rate),
+        "-ac", str(input_channels),
+        "-i", "pipe:0",  # Read from stdin
+        "-ar", str(target_sample_rate),
+        "-ac", str(target_channels),
+        "-f", "s16le",  # Always output 16-bit
+        "pipe:1",  # Write to stdout
+    ]
+
+    # Run FFmpeg with piped I/O
+    process = await asyncio.create_subprocess_exec(
+        *cmd,
+        stdin=asyncio.subprocess.PIPE,
+        stdout=asyncio.subprocess.PIPE,
+        stderr=asyncio.subprocess.PIPE,
+    )
+
+    # Send input data and get output
+    stdout, stderr = await process.communicate(input=audio_data)
+
+    if process.returncode != 0:
+        error_msg = stderr.decode() if stderr else "Unknown error"
+        audio_logger.error(f"FFmpeg resampling failed: {error_msg}")
+        raise RuntimeError(f"Audio resampling failed: {error_msg}")
+
+    audio_logger.info(
+        f"Resampled audio: {input_sample_rate}Hz/{input_channels}ch → "
+        f"{target_sample_rate}Hz/{target_channels}ch "
+        f"({len(audio_data)} → {len(stdout)} bytes)"
+    )
+
+    return stdout
+
+
 async def validate_and_prepare_audio(
     audio_data: bytes,
     expected_sample_rate: int = 16000,
-    convert_to_mono: bool = True
+    convert_to_mono: bool = True,
+    auto_resample: bool = False
 ) -> tuple[bytes, int, int, int, float]:
     """
     Validate WAV audio data and prepare it for processing.
@@ -42,6 +120,7 @@ async def validate_and_prepare_audio(
         audio_data: Raw WAV file bytes
         expected_sample_rate: Expected sample rate (default: 16000 Hz)
         convert_to_mono: Whether to convert stereo to mono (default: True)
+        auto_resample: Whether to automatically resample audio if sample rate doesn't match (default: False)
 
     Returns:
         Tuple of (processed_audio_data, sample_rate, sample_width, channels, duration)
@@ -49,10 +128,6 @@ async def validate_and_prepare_audio(
     Raises:
         AudioValidationError: If audio validation fails
     """
-    import io
-    import wave
-    import numpy as np
-
     try:
         # Parse WAV file
         with wave.open(io.BytesIO(audio_data), "rb") as wav_file:
@@ -68,13 +143,36 @@ async def validate_and_prepare_audio(
     except Exception as e:
         raise AudioValidationError(f"Invalid WAV file: {str(e)}")
 
-    # Validate sample rate
+    # Handle sample rate mismatch
     if sample_rate != expected_sample_rate:
-        raise AudioValidationError(
-            f"Sample rate must be {expected_sample_rate}Hz, got {sample_rate}Hz"
-        )
+        if auto_resample:
+            audio_logger.info(
+                f"Auto-resampling audio from {sample_rate}Hz to {expected_sample_rate}Hz"
+            )
+            # Resample audio using FFmpeg (with pipes, no disk I/O)
+            processed_audio = await resample_audio_with_ffmpeg(
+                audio_data=processed_audio,
+                input_sample_rate=sample_rate,
+                input_channels=channels,
+                input_sample_width=sample_width,
+                target_sample_rate=expected_sample_rate,
+                target_channels=1 if convert_to_mono else channels
+            )
+            # Update metadata after resampling
+            sample_rate = expected_sample_rate
+            sample_width = 2  # FFmpeg outputs 16-bit
+            if convert_to_mono:
+                channels = 1
+            # Recalculate duration
+            duration = len(processed_audio) / (sample_rate * sample_width * channels)
+            # Skip stereo-to-mono conversion since resampling already handled it
+            convert_to_mono = False
+        else:
+            raise AudioValidationError(
+                f"Sample rate must be {expected_sample_rate}Hz, got {sample_rate}Hz"
+            )
 
-    # Convert stereo to mono if requested
+    # Convert stereo to mono if requested and not already done
     if convert_to_mono and channels == 2:
         audio_logger.info(f"Converting stereo audio to mono")
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index d0650f75..26b820a6 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -8,7 +8,7 @@
 import logging
 import time, os
 from datetime import datetime
-from typing import Dict, Any
+from typing import Dict, Any, Optional
 from rq.job import Job
 from rq.exceptions import NoSuchJobError
 
@@ -482,6 +482,11 @@ async def open_conversation_job(
                             'word_count': speech_analysis.get('word_count', 0),
                         }
 
+                        logger.info(
+                            f"🔌 DISPATCH: transcript.streaming event "
+                            f"(conversation={conversation_id[:12]}, segment_id={session_id}_{current_count})"
+                        )
+
                         plugin_results = await plugin_router.dispatch_event(
                             event='transcript.streaming',
                             user_id=user_id,
@@ -489,6 +494,10 @@ async def open_conversation_job(
                             metadata={'client_id': client_id}
                         )
 
+                        logger.info(
+                            f"🔌 RESULT: transcript.streaming dispatched to {len(plugin_results) if plugin_results else 0} plugins"
+                        )
+
                         if plugin_results:
                             logger.info(f"📌 Triggered {len(plugin_results)} streaming transcript plugins")
                             for result in plugin_results:
@@ -509,17 +518,18 @@ async def open_conversation_job(
     )
 
     # Determine end reason based on how we exited the loop
-    # Check session completion_reason from Redis (set by WebSocket controller on disconnect)
+    # Check session completion_reason from Redis (set atomically with status by finalize_session)
     completion_reason = await redis_client.hget(session_key, "completion_reason")
     completion_reason_str = completion_reason.decode() if completion_reason else None
 
     # Determine end_reason with proper precedence:
-    # 1. websocket_disconnect (explicit disconnect from client)
+    # 1. completion_reason from Redis (set by WebSocket controller: websocket_disconnect, user_stopped)
     # 2. inactivity_timeout (no speech for SPEECH_INACTIVITY_THRESHOLD_SECONDS)
     # 3. max_duration (conversation exceeded max runtime)
-    # 4. user_stopped (user manually stopped recording)
-    if completion_reason_str == "websocket_disconnect":
-        end_reason = "websocket_disconnect"
+    # 4. user_stopped (fallback for any other exit condition)
+    if completion_reason_str:
+        end_reason = completion_reason_str
+        logger.info(f"📊 Using completion_reason from session: {end_reason}")
     elif timeout_triggered:
         end_reason = "inactivity_timeout"
     elif time.time() - start_time > max_runtime:
@@ -676,41 +686,38 @@ async def open_conversation_job(
     # Wait a moment to ensure jobs are registered in RQ
     await asyncio.sleep(0.5)
 
-    # Trigger conversation-level plugins
+    # Enqueue conversation.complete event dispatch job
+    # This unifies the dispatch path for both WebSocket and file upload processing
     try:
-        plugin_router = get_plugin_router()
-        if plugin_router:
-            # Get conversation data for plugin context
-            conversation_model = await Conversation.find_one(
-                Conversation.conversation_id == conversation_id
-            )
-
-            plugin_data = {
-                'conversation': {
-                    'conversation_id': conversation_id,
-                    'client_id': client_id,
-                    'user_id': user_id,
-                },
-                'transcript': conversation_model.transcript if conversation_model else "",
-                'duration': time.time() - start_time,
-                'conversation_id': conversation_id,
-            }
-
-            plugin_results = await plugin_router.dispatch_event(
-                event='conversation.complete',
-                user_id=user_id,
-                data=plugin_data,
-                metadata={'end_reason': end_reason}
-            )
+        from rq import Queue
+
+        default_queue = Queue('default', connection=redis_conn)
+
+        dispatch_job = default_queue.enqueue(
+            dispatch_conversation_complete_event_job,
+            conversation_id,
+            client_id,
+            user_id,
+            end_reason,  # Pass the end_reason we determined earlier
+            job_timeout=120,
+            result_ttl=600,
+            job_id=f"event_complete_{conversation_id[:12]}",
+            description=f"Dispatch conversation complete event ({end_reason})",
+            meta={"client_id": client_id}
+        )
 
-            if plugin_results:
-                logger.info(f"📌 Triggered {len(plugin_results)} conversation-level plugins")
-                for result in plugin_results:
-                    if result.message:
-                        logger.info(f"  Plugin result: {result.message}")
+        logger.info(
+            f"📥 Enqueued conversation.complete dispatch job {dispatch_job.id} "
+            f"for {conversation_id[:12]} (end_reason={end_reason})"
+        )
 
     except Exception as e:
-        logger.warning(f"⚠️ Error triggering conversation-level plugins: {e}")
+        logger.error(
+            f"❌ Failed to enqueue conversation.complete dispatch job "
+            f"for {conversation_id[:12]}: {e}",
+            exc_info=True
+        )
+        # Don't fail the entire job - conversation is saved, just plugins won't be notified
 
     # Call shared cleanup/restart logic
     return await handle_end_of_conversation(
@@ -858,20 +865,23 @@ async def dispatch_conversation_complete_event_job(
     conversation_id: str,
     client_id: str,
     user_id: str,
+    end_reason: Optional[str] = None,
     *,
     redis_client=None
 ) -> Dict[str, Any]:
     """
-    Dispatch conversation.complete plugin event for file upload processing.
+    Dispatch conversation.complete plugin event for all conversation sources.
 
-    This job runs at the end of the post-conversation job chain to ensure
-    plugins receive the conversation.complete event for uploaded audio files.
-    WebSocket streaming dispatches this event in open_conversation_job instead.
+    This job runs at the end of conversation processing to ensure plugins
+    receive the conversation.complete event with the correct end_reason.
+    Used by both file upload and WebSocket streaming paths.
 
     Args:
         conversation_id: Conversation ID
         client_id: Client ID
         user_id: User ID
+        end_reason: Reason the conversation ended (e.g., 'file_upload', 'websocket_disconnect', 'user_stopped')
+                   Defaults to 'file_upload' for backward compatibility
         redis_client: Redis client (injected by decorator)
 
     Returns:
@@ -898,22 +908,40 @@ async def dispatch_conversation_complete_event_job(
     try:
         # Get or initialize plugin router (same pattern as transcription_jobs.py)
         plugin_router = get_plugin_router()
+
         if not plugin_router:
-            logger.info("🔧 Initializing plugin router in worker process...")
+            logger.warning("🔧 Plugin router not found in worker process - attempting initialization...")
             plugin_router = init_plugin_router()
 
-            # Initialize all plugins asynchronously (same as app_factory.py)
             if plugin_router:
+                logger.info(f"🔧 Plugin router initialized with {len(plugin_router.plugins)} plugin(s)")
+
+                # Initialize all plugins
                 for plugin_id, plugin in plugin_router.plugins.items():
                     try:
+                        logger.info(f"   Initializing plugin '{plugin_id}'...")
                         await plugin.initialize()
-                        logger.info(f"✅ Plugin '{plugin_id}' initialized")
+                        logger.info(f"   ✓ Plugin '{plugin_id}' initialized")
                     except Exception as e:
-                        logger.error(f"Failed to initialize plugin '{plugin_id}': {e}")
+                        logger.error(f"   ✗ Failed to initialize plugin '{plugin_id}': {e}", exc_info=True)
+            else:
+                logger.error("🔧 Plugin router initialization FAILED - router is None")
 
+        # CRITICAL CHECK: Fail loudly if no router
         if not plugin_router:
-            logger.warning("⚠️ Plugin router could not be initialized, skipping event dispatch")
-            return {"success": True, "skipped": True, "reason": "No plugin router"}
+            error_msg = (
+                f"❌ Plugin router could not be initialized in worker process. "
+                f"conversation.complete event for {conversation_id[:12]} will NOT be dispatched!"
+            )
+            logger.error(error_msg)
+
+            return {
+                "success": False,
+                "skipped": True,
+                "reason": "No plugin router",
+                "conversation_id": conversation_id,
+                "error": error_msg
+            }
 
         plugin_data = {
             'conversation': {
@@ -925,16 +953,28 @@ async def dispatch_conversation_complete_event_job(
             'conversation_id': conversation_id,
         }
 
+        # Use provided end_reason or default to 'file_upload' for backward compatibility
+        actual_end_reason = end_reason or 'file_upload'
+
+        logger.info(
+            f"🔌 DISPATCH: conversation.complete event for {conversation_id[:12]} "
+            f"(end_reason={actual_end_reason}, user={user_id}, client={client_id})"
+        )
+
         plugin_results = await plugin_router.dispatch_event(
             event='conversation.complete',
             user_id=user_id,
             data=plugin_data,
-            metadata={'end_reason': 'file_upload'}
+            metadata={'end_reason': actual_end_reason}
         )
 
+        logger.info(
+            f"🔌 RESULT: conversation.complete dispatched to {len(plugin_results) if plugin_results else 0} plugins"
+        )
         if plugin_results:
             logger.info(f"📌 Triggered {len(plugin_results)} conversation-level plugins")
             for result in plugin_results:
+                logger.info(f"   Plugin result: success={result.success}, message={result.message}")
                 if result.message:
                     logger.info(f"  Plugin result: {result.message}")
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/memory_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/memory_jobs.py
index ee02b065..1a5700bd 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/memory_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/memory_jobs.py
@@ -271,6 +271,11 @@ async def process_memory_job(conversation_id: str, *, redis_client=None) -> Dict
                         'conversation_id': conversation_id,
                     }
 
+                    logger.info(
+                        f"🔌 DISPATCH: memory.processed event "
+                        f"(conversation={conversation_id[:12]}, memories={len(created_memory_ids)})"
+                    )
+
                     plugin_results = await plugin_router.dispatch_event(
                         event='memory.processed',
                         user_id=user_id,
@@ -281,6 +286,10 @@ async def process_memory_job(conversation_id: str, *, redis_client=None) -> Dict
                         }
                     )
 
+                    logger.info(
+                        f"🔌 RESULT: memory.processed dispatched to {len(plugin_results) if plugin_results else 0} plugins"
+                    )
+
                     if plugin_results:
                         logger.info(f"📌 Triggered {len(plugin_results)} memory-level plugins")
                         for result in plugin_results:
diff --git a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
index f7379108..fe130c28 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
@@ -207,9 +207,18 @@ async def recognise_speakers_job(
     actual_transcript_text = transcript_text or transcript_version.transcript or ""
     actual_words = words if words else []
 
-    # If words not provided, we need to get them from metadata
-    if not actual_words and transcript_version.metadata:
-        actual_words = transcript_version.metadata.get("words", [])
+    # If words not provided, extract from segments (single source of truth)
+    if not actual_words and transcript_version.segments:
+        actual_words = []
+        for seg in transcript_version.segments:
+            for word in seg.words:
+                actual_words.append({
+                    "word": word.word,
+                    "start": word.start,
+                    "end": word.end,
+                    "confidence": word.confidence
+                })
+        logger.info(f"🔤 Extracted {len(actual_words)} words from {len(transcript_version.segments)} segments")
 
     if not actual_transcript_text:
         logger.warning(f"🎤 No transcript text found in version {version_id}")
@@ -342,13 +351,27 @@ async def recognise_speakers_job(
                 continue
 
             speaker_name = seg.get("identified_as") or seg.get("speaker", "Unknown")
+
+            # Extract words from speaker service response (already matched to this segment)
+            words_data = seg.get("words", [])
+            segment_words = [
+                Conversation.Word(
+                    word=w.get("word", ""),
+                    start=w.get("start", 0.0),
+                    end=w.get("end", 0.0),
+                    confidence=w.get("confidence")
+                )
+                for w in words_data
+            ]
+
             updated_segments.append(
                 Conversation.SpeakerSegment(
                     start=seg.get("start", 0),
                     end=seg.get("end", 0),
                     text=text,
                     speaker=speaker_name,
-                    confidence=seg.get("confidence")
+                    confidence=seg.get("confidence"),
+                    words=segment_words  # Use words from speaker service
                 )
             )
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
index f492c910..27eb3814 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
@@ -252,14 +252,21 @@ async def transcribe_full_audio_job(
                     'word_count': len(words),
                 }
 
-                logger.info(f"🔍 DEBUG: Dispatching transcript.batch event with user_id={user_id}, client_id={client_id}")
+                logger.info(
+                    f"🔌 DISPATCH: transcript.batch event "
+                    f"(conversation={conversation_id[:12]}, words={len(words)})"
+                )
+
                 plugin_results = await plugin_router.dispatch_event(
                     event='transcript.batch',
                     user_id=user_id,
                     data=plugin_data,
                     metadata={'client_id': client_id}
                 )
-                logger.info(f"🔍 DEBUG: Event dispatch returned {len(plugin_results) if plugin_results else 0} results")
+
+                logger.info(
+                    f"🔌 RESULT: transcript.batch dispatched to {len(plugin_results) if plugin_results else 0} plugins"
+                )
 
                 if plugin_results:
                     logger.info(f"✅ Triggered {len(plugin_results)} transcript plugins in batch mode")
@@ -414,7 +421,6 @@ async def transcribe_full_audio_job(
         "audio_file_size": len(wav_data),
         "segment_count": len(segments),
         "word_count": len(words),
-        "words": words,  # Store words for speaker recognition job to read
         "speaker_recognition": {"enabled": False, "reason": "handled_by_separate_job"},
     }
 
diff --git a/backends/advanced/worker_orchestrator.py b/backends/advanced/worker_orchestrator.py
index 0929bdd0..fb4b6a10 100755
--- a/backends/advanced/worker_orchestrator.py
+++ b/backends/advanced/worker_orchestrator.py
@@ -31,9 +31,9 @@
 
 # Import orchestrator components
 from src.advanced_omi_backend.workers.orchestrator import (
+    HealthMonitor,
     OrchestratorConfig,
     ProcessManager,
-    HealthMonitor,
     build_worker_definitions,
 )
 
@@ -213,7 +213,7 @@ async def run(self):
             await self.shutdown_event.wait()
 
         except Exception as e:
-            logger.error(f"❌ Orchestrator error: {e}", exc_info=True)
+            logger.exception(f"❌ Orchestrator error: {e}")
             raise
         finally:
             # Always perform shutdown
@@ -233,7 +233,7 @@ async def main():
         sys.exit(0)
 
     except Exception as e:
-        logger.error(f"Fatal error: {e}", exc_info=True)
+        logger.exception(f"Fatal error: {e}")
         sys.exit(1)
 
 
diff --git a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
index 2b326bf7..e6c02e95 100644
--- a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
+++ b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
@@ -436,13 +436,13 @@ async def diarize_identify_match(
                 word_start = word.get("start", 0.0)
                 word_end = word.get("end", 0.0)
                 word_mid = (word_start + word_end) / 2
-                
+
                 # Word belongs to this segment if its midpoint is within range
                 if start_time <= word_mid <= end_time:
-                    segment_words.append(word.get("word", ""))
-            
+                    segment_words.append(word)  # Keep full word object with timestamps
+
             # Create segment with matched text
-            segment_text = " ".join(segment_words).strip()
+            segment_text = " ".join(w.get("word", "") for w in segment_words).strip()
             
             if speaker_info and confidence >= similarity_threshold:
                 # Identified speaker
@@ -454,7 +454,8 @@ async def diarize_identify_match(
                     "identified_as": speaker_info["name"],
                     "speaker_id": speaker_info["id"],
                     "confidence": round(float(confidence), 3),
-                    "status": "identified"
+                    "status": "identified",
+                    "words": segment_words  # Include word-level timestamps
                 })
             else:
                 # Unknown speaker
@@ -466,7 +467,8 @@ async def diarize_identify_match(
                     "identified_as": None,
                     "speaker_id": None,
                     "confidence": round(float(confidence), 3) if confidence else 0.0,
-                    "status": "unknown"
+                    "status": "unknown",
+                    "words": segment_words  # Include word-level timestamps
                 })
         
         # Create summary
diff --git a/extras/speaker-recognition/tests/test_speaker_service_integration.py b/extras/speaker-recognition/tests/test_speaker_service_integration.py
index 58e55b61..1ee60bd7 100644
--- a/extras/speaker-recognition/tests/test_speaker_service_integration.py
+++ b/extras/speaker-recognition/tests/test_speaker_service_integration.py
@@ -276,7 +276,7 @@ def test_speaker_recognition_pipeline(speaker_service):
     # Phase 6: Conversation Processing (Basic API Functionality)
     print("🗣️ Phase 6: Conversation processing...")
     print("  Note: Testing API functionality, not requiring perfect speaker identification")
-    
+
     with open(conversation_file, "rb") as f:
         files = {"file": (conversation_file.name, f, "audio/wav")}
         params = {
@@ -286,26 +286,26 @@ def test_speaker_recognition_pipeline(speaker_service):
             "min_speakers": "1",
             "max_speakers": "4",
         }
-        
+
         print(f"  Processing conversation audio (file size: {conversation_file.stat().st_size / (1024*1024):.1f}MB)...")
         r = requests.post(f"{SPEAKER_SERVICE_URL}/diarize-and-identify", files=files, params=params, timeout=300)
-    
+
     assert r.status_code == 200, f"Conversation processing failed: {r.status_code} {r.text[:500]}"
     result = r.json()
-    
+
     # Basic structure validation
     assert "segments" in result, "No segments field in response"
     assert isinstance(result["segments"], list), "Segments is not a list"
     assert len(result["segments"]) > 0, "No segments found in conversation"
-    
+
     # Count identified vs unknown segments
     identified_segments = 0
     total_segments = len(result["segments"])
     identified_speakers = set()
-    
+
     for seg in result["segments"]:
         assert "start" in seg and "end" in seg and "speaker" in seg, "Invalid segment structure"
-        
+
         # Check if speaker was identified (correct field names)
         if seg.get("status") == "identified" and seg.get("identified_id"):
             identified_segments += 1
@@ -314,15 +314,105 @@ def test_speaker_recognition_pipeline(speaker_service):
             confidence = seg.get("confidence", 0.0)
             identified_speakers.add(speaker_id)
             print(f"    Segment identified: {speaker_name} ({speaker_id}) confidence={confidence:.3f}")
-    
+
     print(f"  ✅ Found {total_segments} segments, {identified_segments} with speaker identification")
     print(f"  ✅ Identified speakers: {identified_speakers}")
-    
+
     # Success criteria: API works and produces valid output
     # We don't require perfect speaker identification since that depends on audio quality
     assert total_segments > 0, "No segments produced"
     print("✅ Conversation processing API works correctly")
-    
+
+    # Phase 7: Word-Level Data Validation
+    print("📝 Phase 7: Validating word-level timestamp data in segments...")
+    segments_with_words = 0
+    total_words_found = 0
+
+    for seg in result["segments"]:
+        # Each segment should have a words array (empty segments might have empty array)
+        assert "words" in seg, f"Segment missing 'words' field: {seg}"
+        words = seg.get("words", [])
+
+        if len(words) > 0:
+            segments_with_words += 1
+            total_words_found += len(words)
+
+            # Validate word structure
+            for word in words[:3]:  # Check first 3 words of each segment
+                assert "word" in word, f"Word missing 'word' field: {word}"
+                assert "start" in word, f"Word missing 'start' field: {word}"
+                assert "end" in word, f"Word missing 'end' field: {word}"
+                # confidence is optional
+                assert isinstance(word["start"], (int, float)), f"Word 'start' should be numeric: {word}"
+                assert isinstance(word["end"], (int, float)), f"Word 'end' should be numeric: {word}"
+
+    print(f"  ✅ Word-level data: {segments_with_words}/{total_segments} segments have words ({total_words_found} total words)")
+    assert segments_with_words > 0, "No segments contain word-level timestamp data"
+    assert total_words_found > 0, "No words found across all segments"
+    print("✅ Word-level timestamp data validated successfully")
+
+    # Phase 8: Diarize-Identify-Match Endpoint (Backend Integration Mode)
+    print("🔗 Phase 8: Testing /v1/diarize-identify-match endpoint (backend integration mode)...")
+    print("  This endpoint matches transcript words to diarization segments")
+
+    # Create sample transcript_data with word-level timestamps
+    sample_transcript_data = {
+        "text": "Hello everyone. This is a test conversation.",
+        "words": [
+            {"word": "Hello", "start": 0.5, "end": 0.8, "confidence": 0.95},
+            {"word": "everyone", "start": 0.9, "end": 1.3, "confidence": 0.92},
+            {"word": "This", "start": 2.0, "end": 2.2, "confidence": 0.96},
+            {"word": "is", "start": 2.3, "end": 2.4, "confidence": 0.98},
+            {"word": "a", "start": 2.5, "end": 2.6, "confidence": 0.97},
+            {"word": "test", "start": 2.7, "end": 3.0, "confidence": 0.94},
+            {"word": "conversation", "start": 3.1, "end": 3.8, "confidence": 0.93},
+        ]
+    }
+
+    with open(conversation_file, "rb") as f:
+        files = {"file": (conversation_file.name, f, "audio/wav")}
+        data = {
+            "transcript_data": json.dumps(sample_transcript_data),
+            "user_id": "1",
+            "min_duration": "1.0",
+            "similarity_threshold": "0.10",
+            "min_speakers": "1",
+            "max_speakers": "4",
+        }
+
+        r = requests.post(f"{SPEAKER_SERVICE_URL}/v1/diarize-identify-match", files=files, data=data, timeout=300)
+
+    assert r.status_code == 200, f"/v1/diarize-identify-match failed: {r.status_code} {r.text[:500]}"
+    match_result = r.json()
+
+    # Validate response structure
+    assert "segments" in match_result, "No segments in diarize-identify-match response"
+    match_segments = match_result["segments"]
+    assert len(match_segments) > 0, "No segments returned from diarize-identify-match"
+
+    # Validate that segments contain matched words
+    match_segments_with_words = 0
+    match_total_words = 0
+
+    for seg in match_segments:
+        assert "text" in seg, "Segment missing 'text' field"
+        assert "words" in seg, "Segment missing 'words' field (should include matched transcript words)"
+        words = seg.get("words", [])
+
+        if len(words) > 0:
+            match_segments_with_words += 1
+            match_total_words += len(words)
+
+            # Validate word structure matches input transcript_data
+            for word in words[:2]:  # Check first 2 words
+                assert "word" in word, f"Word missing 'word' field: {word}"
+                assert "start" in word, f"Word missing 'start' field: {word}"
+                assert "end" in word, f"Word missing 'end' field: {word}"
+
+    print(f"  ✅ Diarize-identify-match: {match_segments_with_words}/{len(match_segments)} segments have matched words ({match_total_words} total)")
+    assert match_segments_with_words > 0, "No segments contain matched transcript words"
+    print("✅ /v1/diarize-identify-match endpoint validated successfully")
+
     # Final Summary
     print("=" * 80)
     print("🎉 SPEAKER RECOGNITION INTEGRATION TEST COMPLETED SUCCESSFULLY")
@@ -333,6 +423,8 @@ def test_speaker_recognition_pipeline(speaker_service):
     print(f"✅ Database persistence: PASS (2 speakers)")
     print(f"✅ Individual identification: PASS (both speakers)")
     print(f"✅ Conversation processing: PASS ({total_segments} segments, {identified_segments} identified)")
+    print(f"✅ Word-level timestamps: PASS ({total_words_found} words in {segments_with_words} segments)")
+    print(f"✅ Diarize-identify-match: PASS ({match_total_words} matched words in {match_segments_with_words} segments)")
     print("=" * 80)
 
 
diff --git a/tests/infrastructure/infra_tests.robot b/tests/infrastructure/infra_tests.robot
index 59ac95c1..783329ae 100644
--- a/tests/infrastructure/infra_tests.robot
+++ b/tests/infrastructure/infra_tests.robot
@@ -87,15 +87,58 @@ Verify Workers Still Running In Container
 
 Restart Workers Container
     [Documentation]    Restart the workers container to restore registration
+    ...                Uses docker compose for more reliable restart
     Log To Console    \n🔄 Restarting workers container...
 
-    ${result}=    Run Process    docker    restart    ${WORKERS_CONTAINER}    shell=False
-    Should Be Equal As Integers    ${result.rc}    0
+    # Use docker compose restart for more reliable restart
+    ${result}=    Run Process    docker    compose    -f    docker-compose-test.yml    restart    workers-test
+    ...    cwd=${BACKEND_DIR}    shell=False
+
+    IF    ${result.rc} != 0
+        Log To Console    ⚠️ Docker compose restart failed, attempting docker restart...
+        Log To Console    stderr: ${result.stderr}
+        # Fallback to direct docker restart
+        ${result}=    Run Process    docker    restart    ${WORKERS_CONTAINER}    shell=False
+    END
+
+    Should Be Equal As Integers    ${result.rc}    0    msg=Failed to restart workers: ${result.stderr}
 
-    # Wait for workers to start
-    Sleep    5s    reason=Wait for workers to initialize
+    # Wait for workers to start and register
+    Sleep    10s    reason=Wait for workers to initialize and register
     Log To Console    ✅ Workers container restarted
 
+Verify Workers Healthy Or Restart
+    [Documentation]    Check if workers are healthy, restart if needed
+    ...                This ensures subsequent tests have a working environment
+    Log To Console    \n🧹 Cleanup: Verifying worker health...
+
+    TRY
+        ${worker_count}=    Get Worker Count From Health Endpoint
+        Log To Console    Current worker count: ${worker_count}
+
+        IF    ${worker_count} < 6
+            Log To Console    ⚠️ Only ${worker_count} workers detected, restarting to restore health...
+            Restart Workers Container
+
+            # Verify workers recovered after restart
+            Sleep    10s    reason=Wait for workers to fully initialize
+            ${new_count}=    Get Worker Count From Health Endpoint
+            Log To Console    Worker count after restart: ${new_count}
+
+            IF    ${new_count} < 6
+                Log To Console    ⚠️ WARNING: Only ${new_count} workers after restart (expected 6+)
+            ELSE
+                Log To Console    ✅ Workers healthy: ${new_count} workers registered
+            END
+        ELSE
+            Log To Console    ✅ Workers healthy: ${worker_count} workers registered (no restart needed)
+        END
+    EXCEPT    AS    ${error}
+        Log To Console    ⚠️ Failed to verify worker health: ${error}
+        Log To Console    Attempting emergency restart...
+        Restart Workers Container
+    END
+
 *** Test Cases ***
 Worker Registration Loss Detection Test
     [Documentation]    Test that the system can automatically recover when workers lose Redis registration
@@ -169,10 +212,7 @@ Worker Registration Loss Detection Test
         Fail    Self-healing mechanism not working: Workers did not re-register after 90 seconds
     END
 
-    # Cleanup: Always restart workers after this test to ensure subsequent tests work
-    [Teardown]    Run Keywords
-    ...    Log To Console    \n🧹 Cleanup: Restarting workers for subsequent tests
-    ...    AND    Restart Workers Container
+    [Teardown]    Verify Workers Healthy Or Restart
 
 Worker Count Validation Test
     [Documentation]    Verify the health endpoint accurately reports worker counts
@@ -278,6 +318,9 @@ WebSocket Disconnect Conversation End Reason Test
     # Send audio fast (no realtime pacing) to trigger conversation creation
     Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
 
+    # Initialize conversation_id to None (will be set when found)
+    ${conversation_id}=    Set Variable    ${None}
+
     # Keep sending audio in a loop to prevent inactivity timeout while waiting for conversation
     # We need to continuously send audio because SPEECH_INACTIVITY_THRESHOLD_SECONDS=2
     FOR    ${i}    IN RANGE    20    # Send 20 batches while waiting
diff --git a/tests/integration/audio_streaming_integration_tests.robot b/tests/integration/audio_streaming_integration_tests.robot
index b9c5e6fd..f34b7984 100644
--- a/tests/integration/audio_streaming_integration_tests.robot
+++ b/tests/integration/audio_streaming_integration_tests.robot
@@ -170,10 +170,10 @@ Session Cleaned Up After Stream Close
     # Wait for finalization
     Sleep    2s
 
-    # Verify session is finalized or complete (jobs may finish quickly for short streams)
+    # Verify session is finalized or finished (jobs may finish quickly for short streams)
     ${session_after}=    Get Redis Session Data    ${client_id}
-    Should Be True    '${session_after}[status]' in ['finalizing', 'complete']
-    ...    Session status should be finalizing or complete, got: ${session_after}[status]
+    Should Be True    '${session_after}[status]' in ['finalizing', 'finished']
+    ...    Session status should be finalizing or finished, got: ${session_after}[status]
 
     Log    ✅ Session status updated to ${session_after}[status]
 
diff --git a/tests/integration/plugin_event_tests.robot b/tests/integration/plugin_event_tests.robot
index fd9056c3..f78649ad 100644
--- a/tests/integration/plugin_event_tests.robot
+++ b/tests/integration/plugin_event_tests.robot
@@ -160,9 +160,9 @@ WebSocket Disconnect Should Trigger Conversation Complete Event
     ${conversation_id}=    Evaluate    $conv_meta.get('conversation_id', '')
     Should Not Be Equal    ${conversation_id}    ${EMPTY}    Conversation ID should be set
 
-    # Disconnect WebSocket (triggers conversation close with websocket_disconnect end_reason)
-    ${total_chunks}=    Close Audio Stream    ${stream_id}
-    Log    Closed WebSocket stream, sent ${total_chunks} total chunks
+    # Disconnect WebSocket abruptly without audio-stop (triggers websocket_disconnect end_reason)
+    ${total_chunks}=    Close Audio Stream Without Stop Event    ${stream_id}
+    Log    Closed WebSocket stream abruptly, sent ${total_chunks} total chunks
 
     # Wait for plugin event dispatch (polls every 2s, max 10s)
     ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=10s
diff --git a/tests/libs/audio_stream_library.py b/tests/libs/audio_stream_library.py
index 25399175..e14a174e 100644
--- a/tests/libs/audio_stream_library.py
+++ b/tests/libs/audio_stream_library.py
@@ -136,6 +136,15 @@ def stop_audio_stream(stream_id: str) -> int:
     return _manager.stop_stream(stream_id)
 
 
+def close_audio_stream_without_stop(stream_id: str) -> int:
+    """Close WebSocket connection without sending audio-stop event.
+
+    This simulates abrupt disconnection (network failure, client crash)
+    and should trigger websocket_disconnect end_reason.
+    """
+    return _manager.close_stream_without_stop(stream_id)
+
+
 def cleanup_all_streams():
     """Stop all active streams."""
     _manager.cleanup_all()
diff --git a/tests/resources/queue_keywords.robot b/tests/resources/queue_keywords.robot
index dac88e17..5ba91bf0 100644
--- a/tests/resources/queue_keywords.robot
+++ b/tests/resources/queue_keywords.robot
@@ -334,7 +334,7 @@ Get Job Result
     [Arguments]    ${job_id}
 
     # Get full job details
-    ${response}=    GET On Session    api    /api/queue/job/${job_id}
+    ${response}=    GET On Session    api    /api/queue/jobs/${job_id}
     ...    expected_status=200
 
     ${job_data}=    Set Variable    ${response.json()}
diff --git a/tests/resources/websocket_keywords.robot b/tests/resources/websocket_keywords.robot
index 51dd6f03..f1fbf378 100644
--- a/tests/resources/websocket_keywords.robot
+++ b/tests/resources/websocket_keywords.robot
@@ -132,6 +132,17 @@ Close Audio Stream
     Log    Stopped stream ${stream_id}, total chunks: ${total_chunks}
     RETURN    ${total_chunks}
 
+Close Audio Stream Without Stop Event
+    [Documentation]    Close WebSocket connection without sending audio-stop event.
+    ...                This simulates abrupt disconnection (network failure, client crash)
+    ...                and should trigger websocket_disconnect end_reason.
+    [Arguments]    ${stream_id}
+
+    # Call the Python library method directly
+    ${total_chunks}=    Close Audio Stream Without Stop    ${stream_id}
+    Log    Closed stream ${stream_id} abruptly (no audio-stop), total chunks: ${total_chunks}
+    RETURN    ${total_chunks}
+
 Cleanup All Audio Streams
     [Documentation]    Stop all active streams (use in teardown)
     Cleanup All Streams

From 24a34190c92550dcab2bb5ffff7c305fcd49045c Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Tue, 20 Jan 2026 06:15:35 +0000
Subject: [PATCH 04/14] Enhance Docker command handling and configuration
 management

- Updated `run_compose_command` to support separate build commands for services, including profile management for backend and speaker-recognition services.
- Improved error handling and output streaming during Docker command execution.
- Added `ensure_docker_network` function to verify and create the required Docker network before starting services.
- Refactored configuration files to utilize `oc.env` for environment variable management, ensuring better compatibility and flexibility across different environments.
---
 services.py                       | 224 ++++++++++++++++++------------
 tests/configs/deepgram-openai.yml |  16 +--
 tests/configs/mock-services.yml   |   6 +-
 tests/configs/parakeet-ollama.yml |  12 +-
 tests/configs/parakeet-openai.yml |  12 +-
 5 files changed, 161 insertions(+), 109 deletions(-)

diff --git a/services.py b/services.py
index b4ed44fd..648c3193 100755
--- a/services.py
+++ b/services.py
@@ -80,19 +80,97 @@ def run_compose_command(service_name, command, build=False):
         console.print(f"[red]❌ Docker compose file not found: {compose_file}[/red]")
         return False
 
+    # Step 1: If build is requested, run build separately first (no timeout for CUDA builds)
+    if build and command == 'up':
+        # Build command - need to specify profiles for build too
+        build_cmd = ['docker', 'compose']
+
+        # Add profiles to build command (needed for profile-specific services)
+        if service_name == 'backend':
+            caddyfile_path = service_path / 'Caddyfile'
+            if caddyfile_path.exists() and caddyfile_path.is_file():
+                build_cmd.extend(['--profile', 'https'])
+
+            obsidian_enabled = False
+            config_data = load_config_yml()
+            if config_data:
+                memory_config = config_data.get('memory', {})
+                obsidian_config = memory_config.get('obsidian', {})
+                if obsidian_config.get('enabled', False):
+                    obsidian_enabled = True
+
+            if not obsidian_enabled:
+                env_file = service_path / '.env'
+                if env_file.exists():
+                    env_values = dotenv_values(env_file)
+                    if env_values.get('OBSIDIAN_ENABLED', 'false').lower() == 'true':
+                        obsidian_enabled = True
+
+            if obsidian_enabled:
+                build_cmd.extend(['--profile', 'obsidian'])
+
+        elif service_name == 'speaker-recognition':
+            env_file = service_path / '.env'
+            if env_file.exists():
+                env_values = dotenv_values(env_file)
+                compute_mode = env_values.get('COMPUTE_MODE', 'cpu')
+                build_cmd.extend(['--profile', compute_mode])
+
+        build_cmd.append('build')
+
+        # Run build with streaming output (no timeout)
+        console.print(f"[cyan]🔨 Building {service_name} (this may take several minutes for CUDA/GPU builds)...[/cyan]")
+        try:
+            process = subprocess.Popen(
+                build_cmd,
+                cwd=service_path,
+                stdout=subprocess.PIPE,
+                stderr=subprocess.STDOUT,
+                text=True,
+                bufsize=1
+            )
+
+            if process.stdout is None:
+                raise RuntimeError("Process stdout is None - unable to read command output")
+
+            for line in process.stdout:
+                line = line.rstrip()
+                if not line:
+                    continue
+
+                if 'error' in line.lower() or 'failed' in line.lower():
+                    console.print(f"  [red]{line}[/red]")
+                elif 'Successfully' in line or 'built' in line.lower():
+                    console.print(f"  [green]{line}[/green]")
+                elif 'Building' in line or 'Step' in line:
+                    console.print(f"  [cyan]{line}[/cyan]")
+                elif 'warning' in line.lower():
+                    console.print(f"  [yellow]{line}[/yellow]")
+                else:
+                    console.print(f"  [dim]{line}[/dim]")
+
+            process.wait()
+
+            if process.returncode != 0:
+                console.print(f"\n[red]❌ Build failed for {service_name}[/red]")
+                return False
+
+            console.print(f"[green]✅ Build completed for {service_name}[/green]")
+
+        except Exception as e:
+            console.print(f"[red]❌ Error building {service_name}: {e}[/red]")
+            return False
+
+    # Step 2: Run the actual command (up/down/restart/status)
     cmd = ['docker', 'compose']
 
-    # For backend service, check if HTTPS is configured (Caddyfile exists)
+    # Add profiles for backend service
     if service_name == 'backend':
         caddyfile_path = service_path / 'Caddyfile'
         if caddyfile_path.exists() and caddyfile_path.is_file():
-            # Enable HTTPS profile to start Caddy service
             cmd.extend(['--profile', 'https'])
 
-        # Check if Obsidian/Neo4j is enabled
         obsidian_enabled = False
-
-        # Method 1: Check config.yml (preferred)
         config_data = load_config_yml()
         if config_data:
             memory_config = config_data.get('memory', {})
@@ -100,7 +178,6 @@ def run_compose_command(service_name, command, build=False):
             if obsidian_config.get('enabled', False):
                 obsidian_enabled = True
 
-        # Method 2: Fallback to .env for backward compatibility
         if not obsidian_enabled:
             env_file = service_path / '.env'
             if env_file.exists():
@@ -114,30 +191,22 @@ def run_compose_command(service_name, command, build=False):
 
     # Handle speaker-recognition service specially
     if service_name == 'speaker-recognition' and command in ['up', 'down']:
-        # Read configuration to determine profile
         env_file = service_path / '.env'
         if env_file.exists():
             env_values = dotenv_values(env_file)
             compute_mode = env_values.get('COMPUTE_MODE', 'cpu')
 
-            # Add profile flag for both up and down commands
-            if compute_mode == 'gpu':
-                cmd.extend(['--profile', 'gpu'])
-            else:
-                cmd.extend(['--profile', 'cpu'])
+            cmd.extend(['--profile', compute_mode])
 
             if command == 'up':
                 https_enabled = env_values.get('REACT_UI_HTTPS', 'false')
                 if https_enabled.lower() == 'true':
-                    # HTTPS mode: start with profile for all services (includes nginx)
                     cmd.extend(['up', '-d'])
                 else:
-                    # HTTP mode: start specific services with profile (no nginx)
                     cmd.extend(['up', '-d', 'speaker-service-gpu' if compute_mode == 'gpu' else 'speaker-service-cpu', 'web-ui'])
             elif command == 'down':
                 cmd.extend(['down'])
         else:
-            # Fallback: no profile
             if command == 'up':
                 cmd.extend(['up', '-d'])
             elif command == 'down':
@@ -152,79 +221,28 @@ def run_compose_command(service_name, command, build=False):
             cmd.extend(['restart'])
         elif command == 'status':
             cmd.extend(['ps'])
-    
-    if command == 'up' and build:
-        cmd.append('--build')
-    
+
     try:
-        # For commands that need real-time output (build), stream to console
-        if build and command == 'up':
-            console.print(f"[dim]Building {service_name} containers...[/dim]")
-            process = subprocess.Popen(
-                cmd,
-                cwd=service_path,
-                stdout=subprocess.PIPE,
-                stderr=subprocess.STDOUT,
-                text=True,
-                bufsize=1
-            )
-            
-            # Simply stream all output with coloring
-            all_output = []
-            
-            if process.stdout is None:
-                raise RuntimeError("Process stdout is None - unable to read command output")
-            for line in process.stdout:
-                line = line.rstrip()
-                if not line:
-                    continue
-                
-                # Store for error context
-                all_output.append(line)
-                
-                # Print with appropriate coloring
-                if 'error' in line.lower() or 'failed' in line.lower():
-                    console.print(f"  [red]{line}[/red]")
-                elif 'Successfully' in line or 'Started' in line or 'Created' in line:
-                    console.print(f"  [green]{line}[/green]")
-                elif 'Building' in line or 'Creating' in line:
-                    console.print(f"  [cyan]{line}[/cyan]")
-                elif 'warning' in line.lower():
-                    console.print(f"  [yellow]{line}[/yellow]")
-                else:
-                    console.print(f"  [dim]{line}[/dim]")
-            
-            # Wait for process to complete
-            process.wait()
-            
-            # If build failed, show error summary
-            if process.returncode != 0:
-                console.print(f"\n[red]❌ Build failed for {service_name}[/red]")
-                return False
-            
+        # Run the command with timeout (build already done if needed)
+        result = subprocess.run(
+            cmd,
+            cwd=service_path,
+            capture_output=True,
+            text=True,
+            check=False,
+            timeout=120  # 2 minute timeout
+        )
+
+        if result.returncode == 0:
             return True
         else:
-            # For non-build commands, run silently unless there's an error
-            result = subprocess.run(
-                cmd,
-                cwd=service_path,
-                capture_output=True,
-                text=True,
-                check=False,
-                timeout=120  # 2 minute timeout for service status checks
-            )
-            
-            if result.returncode == 0:
-                return True
-            else:
-                console.print(f"[red]❌ Command failed[/red]")
-                if result.stderr:
-                    console.print("[red]Error output:[/red]")
-                    # Show all error output
-                    for line in result.stderr.splitlines():
-                        console.print(f"  [dim]{line}[/dim]")
-                return False
-            
+            console.print(f"[red]❌ Command failed[/red]")
+            if result.stderr:
+                console.print("[red]Error output:[/red]")
+                for line in result.stderr.splitlines():
+                    console.print(f"  [dim]{line}[/dim]")
+            return False
+
     except subprocess.TimeoutExpired:
         console.print(f"[red]❌ Command timed out after 2 minutes for {service_name}[/red]")
         return False
@@ -232,10 +250,44 @@ def run_compose_command(service_name, command, build=False):
         console.print(f"[red]❌ Error running command: {e}[/red]")
         return False
 
+def ensure_docker_network():
+    """Ensure chronicle-network exists"""
+    try:
+        # Check if network already exists
+        result = subprocess.run(
+            ['docker', 'network', 'inspect', 'chronicle-network'],
+            capture_output=True,
+            check=False
+        )
+
+        if result.returncode != 0:
+            # Network doesn't exist, create it
+            console.print("[blue]📡 Creating chronicle-network...[/blue]")
+            subprocess.run(
+                ['docker', 'network', 'create', 'chronicle-network'],
+                check=True,
+                capture_output=True
+            )
+            console.print("[green]✅ chronicle-network created[/green]")
+        else:
+            console.print("[dim]📡 chronicle-network already exists[/dim]")
+        return True
+    except subprocess.CalledProcessError as e:
+        console.print(f"[red]❌ Failed to create network: {e}[/red]")
+        return False
+    except Exception as e:
+        console.print(f"[red]❌ Error checking/creating network: {e}[/red]")
+        return False
+
 def start_services(services, build=False):
     """Start specified services"""
     console.print(f"🚀 [bold]Starting {len(services)} services...[/bold]")
-    
+
+    # Ensure Docker network exists before starting services
+    if not ensure_docker_network():
+        console.print("[red]❌ Cannot start services without Docker network[/red]")
+        return
+
     success_count = 0
     for service_name in services:
         if service_name not in SERVICES:
diff --git a/tests/configs/deepgram-openai.yml b/tests/configs/deepgram-openai.yml
index e92bcbc5..e15ec756 100644
--- a/tests/configs/deepgram-openai.yml
+++ b/tests/configs/deepgram-openai.yml
@@ -23,7 +23,7 @@ memory:
   timeout_seconds: 1200
 models:
 - api_family: openai
-  api_key: ${OPENAI_API_KEY:-}
+  api_key: ${oc.env:OPENAI_API_KEY,}
   description: OpenAI GPT-4o-mini
   model_name: gpt-4o-mini
   model_output: json
@@ -35,7 +35,7 @@ models:
   model_url: https://api.openai.com/v1
   name: openai-llm
 - api_family: openai
-  api_key: ${OPENAI_API_KEY:-}
+  api_key: ${oc.env:OPENAI_API_KEY,}
   description: OpenAI text-embedding-3-small
   embedding_dimensions: 1536
   model_name: text-embedding-3-small
@@ -48,14 +48,14 @@ models:
   description: Qdrant vector database
   model_params:
     collection_name: omi_memories
-    host: ${QDRANT_BASE_URL:-qdrant}
-    port: ${QDRANT_PORT:-6333}
+    host: ${oc.env:QDRANT_BASE_URL,qdrant}
+    port: ${oc.env:QDRANT_PORT,6333}
   model_provider: qdrant
   model_type: vector_store
-  model_url: http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333}
+  model_url: http://${oc.env:QDRANT_BASE_URL,qdrant}:${oc.env:QDRANT_PORT,6333}
   name: vs-qdrant
 - api_family: http
-  api_key: ${DEEPGRAM_API_KEY:-}
+  api_key: ${oc.env:DEEPGRAM_API_KEY,}
   description: Deepgram Nova 3 (batch)
   model_provider: deepgram
   model_type: stt
@@ -64,7 +64,7 @@ models:
   operations:
     stt_transcribe:
       headers:
-        Authorization: Token ${DEEPGRAM_API_KEY:-}
+        Authorization: Token ${oc.env:DEEPGRAM_API_KEY,}
         Content-Type: audio/raw
       method: POST
       path: /listen
@@ -84,7 +84,7 @@ models:
           words: results.channels[0].alternatives[0].words
         type: json
 - api_family: websocket
-  api_key: ${DEEPGRAM_API_KEY:-}
+  api_key: ${oc.env:DEEPGRAM_API_KEY,}
   description: Deepgram Nova 3 (streaming)
   model_provider: deepgram
   model_type: stt_stream
diff --git a/tests/configs/mock-services.yml b/tests/configs/mock-services.yml
index 34359bd4..a86e11c1 100644
--- a/tests/configs/mock-services.yml
+++ b/tests/configs/mock-services.yml
@@ -38,11 +38,11 @@ models:
   description: Qdrant vector database (local)
   model_params:
     collection_name: omi_memories
-    host: ${QDRANT_BASE_URL:-qdrant}
-    port: ${QDRANT_PORT:-6333}
+    host: ${oc.env:QDRANT_BASE_URL,qdrant}
+    port: ${oc.env:QDRANT_PORT,6333}
   model_provider: qdrant
   model_type: vector_store
-  model_url: http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333}
+  model_url: http://${oc.env:QDRANT_BASE_URL,qdrant}:${oc.env:QDRANT_PORT,6333}
   name: vs-qdrant
 speaker_recognition:
   enabled: false
diff --git a/tests/configs/parakeet-ollama.yml b/tests/configs/parakeet-ollama.yml
index a4ef958d..99dd7362 100644
--- a/tests/configs/parakeet-ollama.yml
+++ b/tests/configs/parakeet-ollama.yml
@@ -15,7 +15,7 @@ models:
     api_family: openai
     model_name: llama3.1:latest
     model_url: http://localhost:11434/v1
-    api_key: ${OPENAI_API_KEY:-ollama}
+    api_key: ${oc.env:OPENAI_API_KEY,ollama}
     model_params:
       temperature: 0.2
       max_tokens: 2000
@@ -28,7 +28,7 @@ models:
     api_family: openai
     model_name: nomic-embed-text:latest
     model_url: http://localhost:11434/v1
-    api_key: ${OPENAI_API_KEY:-ollama}
+    api_key: ${oc.env:OPENAI_API_KEY,ollama}
     embedding_dimensions: 768
     model_output: vector
 
@@ -37,10 +37,10 @@ models:
     model_type: vector_store
     model_provider: qdrant
     api_family: qdrant
-    model_url: http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333}
+    model_url: http://${oc.env:QDRANT_BASE_URL,qdrant}:${oc.env:QDRANT_PORT,6333}
     model_params:
-      host: ${QDRANT_BASE_URL:-qdrant}
-      port: ${QDRANT_PORT:-6333}
+      host: ${oc.env:QDRANT_BASE_URL,qdrant}
+      port: ${oc.env:QDRANT_PORT,6333}
       collection_name: omi_memories
 
   - name: stt-parakeet-batch
@@ -48,7 +48,7 @@ models:
     model_type: stt
     model_provider: parakeet
     api_family: http
-    model_url: ${PARAKEET_ASR_URL:-http://localhost:8767}
+    model_url: ${oc.env:PARAKEET_ASR_URL,http://localhost:8767}
     api_key: ''
     operations:
       stt_transcribe:
diff --git a/tests/configs/parakeet-openai.yml b/tests/configs/parakeet-openai.yml
index f3147c33..c0d7b40a 100644
--- a/tests/configs/parakeet-openai.yml
+++ b/tests/configs/parakeet-openai.yml
@@ -15,7 +15,7 @@ models:
     api_family: openai
     model_name: gpt-4o-mini
     model_url: https://api.openai.com/v1
-    api_key: ${OPENAI_API_KEY:-}
+    api_key: ${oc.env:OPENAI_API_KEY,}
     model_params:
       temperature: 0.2
       max_tokens: 2000
@@ -28,7 +28,7 @@ models:
     api_family: openai
     model_name: text-embedding-3-small
     model_url: https://api.openai.com/v1
-    api_key: ${OPENAI_API_KEY:-}
+    api_key: ${oc.env:OPENAI_API_KEY,}
     embedding_dimensions: 1536
     model_output: vector
 
@@ -37,10 +37,10 @@ models:
     model_type: vector_store
     model_provider: qdrant
     api_family: qdrant
-    model_url: http://${QDRANT_BASE_URL:-qdrant}:${QDRANT_PORT:-6333}
+    model_url: http://${oc.env:QDRANT_BASE_URL,qdrant}:${oc.env:QDRANT_PORT,6333}
     model_params:
-      host: ${QDRANT_BASE_URL:-qdrant}
-      port: ${QDRANT_PORT:-6333}
+      host: ${oc.env:QDRANT_BASE_URL,qdrant}
+      port: ${oc.env:QDRANT_PORT,6333}
       collection_name: omi_memories
 
   - name: stt-parakeet-batch
@@ -48,7 +48,7 @@ models:
     model_type: stt
     model_provider: parakeet
     api_family: http
-    model_url: ${PARAKEET_ASR_URL:-http://localhost:8767}
+    model_url: ${oc.env:PARAKEET_ASR_URL,http://localhost:8767}
     api_key: ''
     operations:
       stt_transcribe:

From c1b84aecb6f5747cf1f088e9d81c90883b7852c1 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Tue, 20 Jan 2026 08:39:20 +0000
Subject: [PATCH 05/14] Enhance configuration loading to support custom config
 file paths

- Added support for the CONFIG_FILE environment variable to allow specifying custom configuration files for testing.
- Implemented logic to handle both absolute paths and relative filenames for the configuration file, improving flexibility in configuration management.
---
 backends/advanced/docker-compose-test.yml              | 10 ++++++++--
 .../advanced/src/advanced_omi_backend/config_loader.py |  9 ++++++++-
 2 files changed, 16 insertions(+), 3 deletions(-)

diff --git a/backends/advanced/docker-compose-test.yml b/backends/advanced/docker-compose-test.yml
index c6df21f4..bb2ac530 100644
--- a/backends/advanced/docker-compose-test.yml
+++ b/backends/advanced/docker-compose-test.yml
@@ -18,7 +18,8 @@ services:
       - ./data/test_audio_chunks:/app/audio_chunks
       - ./data/test_debug_dir:/app/debug  # Fixed: mount to /app/debug for plugin database
       - ./data/test_data:/app/data
-      - ../../config:/app/config  # Mount config directory with defaults.yml and config.yml
+      - ../../config:/app/config  # Mount config directory with defaults.yml
+      - ../../tests/configs:/app/test-configs:ro  # Mount test-specific configs
       - ${PLUGINS_CONFIG:-../../tests/config/plugins.test.yml}:/app/config/plugins.yml  # Mount test plugins config to correct location
     environment:
       # Override with test-specific settings
@@ -27,6 +28,8 @@ services:
       - QDRANT_PORT=6333
       - REDIS_URL=redis://redis-test:6379/0
       - DEBUG_DIR=/app/debug  # Fixed: match plugin database mount path
+      # Test configuration file
+      - CONFIG_FILE=${TEST_CONFIG_FILE:-/app/test-configs/deepgram-openai.yml}
       # Import API keys from environment
       - DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY}
       - OPENAI_API_KEY=${OPENAI_API_KEY}
@@ -171,7 +174,8 @@ services:
       - ./data/test_audio_chunks:/app/audio_chunks
       - ./data/test_debug_dir:/app/debug  # Fixed: mount to /app/debug for plugin database
       - ./data/test_data:/app/data
-      - ../../config:/app/config  # Mount config directory with defaults.yml and config.yml
+      - ../../config:/app/config  # Mount config directory with defaults.yml
+      - ../../tests/configs:/app/test-configs:ro  # Mount test-specific configs
       - ${PLUGINS_CONFIG:-../../tests/config/plugins.test.yml}:/app/config/plugins.yml  # Mount test plugins config to correct location
     environment:
       # Same environment as backend
@@ -180,6 +184,8 @@ services:
       - QDRANT_PORT=6333
       - REDIS_URL=redis://redis-test:6379/0
       - DEBUG_DIR=/app/debug  # Fixed: match plugin database mount path
+      # Test configuration file
+      - CONFIG_FILE=${TEST_CONFIG_FILE:-/app/test-configs/deepgram-openai.yml}
       - DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY}
       - OPENAI_API_KEY=${OPENAI_API_KEY}
       - GROQ_API_KEY=${GROQ_API_KEY}
diff --git a/backends/advanced/src/advanced_omi_backend/config_loader.py b/backends/advanced/src/advanced_omi_backend/config_loader.py
index 6b504c79..5d25debd 100644
--- a/backends/advanced/src/advanced_omi_backend/config_loader.py
+++ b/backends/advanced/src/advanced_omi_backend/config_loader.py
@@ -55,7 +55,14 @@ def load_config(force_reload: bool = False) -> DictConfig:
 
     config_dir = get_config_dir()
     defaults_path = config_dir / "defaults.yml"
-    config_path = config_dir / "config.yml"
+
+    # Support CONFIG_FILE env var for test configurations
+    config_file = os.getenv("CONFIG_FILE", "config.yml")
+    # Handle both absolute paths and relative filenames
+    if os.path.isabs(config_file):
+        config_path = Path(config_file)
+    else:
+        config_path = config_dir / config_file
 
     # Load defaults
     defaults = {}

From 3a55ac983424366986cbda8e14710020a06beb56 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Tue, 20 Jan 2026 08:43:41 +0000
Subject: [PATCH 06/14] Update test scripts to use TEST_CONFIG_FILE for
 configuration management

- Replaced CONFIG_FILE with TEST_CONFIG_FILE in both run-no-api-tests.sh and run-robot-tests.sh to standardize configuration file usage.
- Updated paths to point to mock and deepgram-openai configuration files inside the container, improving clarity and consistency in test setups.
---
 tests/run-no-api-tests.sh | 10 +++-------
 tests/run-robot-tests.sh  | 12 +++---------
 2 files changed, 6 insertions(+), 16 deletions(-)

diff --git a/tests/run-no-api-tests.sh b/tests/run-no-api-tests.sh
index 25d04f97..b5c5a505 100755
--- a/tests/run-no-api-tests.sh
+++ b/tests/run-no-api-tests.sh
@@ -49,14 +49,10 @@ CLEANUP_CONTAINERS="${CLEANUP_CONTAINERS:-false}"
 OUTPUTDIR="${OUTPUTDIR:-results-no-api}"
 
 # Use mock services config (no API keys needed)
-export CONFIG_FILE="${CONFIG_FILE:-configs/mock-services.yml}"
+# Set TEST_CONFIG_FILE to point to mock-services.yml inside the container
+export TEST_CONFIG_FILE="/app/test-configs/mock-services.yml"
 
-# Convert CONFIG_FILE to absolute path
-if [[ ! "$CONFIG_FILE" = /* ]]; then
-    CONFIG_FILE="$(cd "$(dirname "$CONFIG_FILE")" && pwd)/$(basename "$CONFIG_FILE")"
-fi
-
-print_info "Using config file: $CONFIG_FILE"
+print_info "Using config file: ${TEST_CONFIG_FILE}"
 print_warning "Memory extraction and transcription are disabled in this mode"
 
 # Load environment variables if available (but don't require them)
diff --git a/tests/run-robot-tests.sh b/tests/run-robot-tests.sh
index 015b63e0..7f7cd5c4 100755
--- a/tests/run-robot-tests.sh
+++ b/tests/run-robot-tests.sh
@@ -46,15 +46,9 @@ print_info "============================"
 CLEANUP_CONTAINERS="${CLEANUP_CONTAINERS:-false}"  # Changed default: keep containers running for faster re-runs
 OUTPUTDIR="${OUTPUTDIR:-results}"
 
-# Set default CONFIG_FILE if not provided
-# Use test config by default (disables speaker recognition for CI performance)
-# Override: CONFIG_FILE=../config/config.yml ./run-robot-tests.sh
-export CONFIG_FILE="${CONFIG_FILE:-configs/deepgram-openai.yml}"
-
-# Convert CONFIG_FILE to absolute path (Docker Compose resolves relative paths from compose file location)
-if [[ ! "$CONFIG_FILE" = /* ]]; then
-    CONFIG_FILE="$(cd "$(dirname "$CONFIG_FILE")" && pwd)/$(basename "$CONFIG_FILE")"
-fi
+# Use Deepgram + OpenAI config for full API tests
+# Set TEST_CONFIG_FILE to point to deepgram-openai.yml inside the container
+export TEST_CONFIG_FILE="/app/test-configs/deepgram-openai.yml"
 
 # Load environment variables (CI or local)
 if [ -f "setup/.env.test" ] && [ -z "$DEEPGRAM_API_KEY" ]; then

From 157e1c7e8bbc50409417546bc3b49295c1390594 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Wed, 21 Jan 2026 22:30:58 +0000
Subject: [PATCH 07/14] Refactor audio upload response handling and improve
 error reporting

- Updated `upload_and_process_audio_files` to return appropriate HTTP status codes based on upload results: 400 for all failures, 207 for partial successes, and 200 for complete success.
- Enhanced error messages in the audio upload tests to provide clearer feedback on upload failures, including specific error details for better debugging.
- Adjusted test scripts to ensure consistent handling of conversation IDs in job metadata, improving validation checks for job creation.
---
 .../controllers/audio_controller.py           | 15 ++++-
 .../controllers/queue_controller.py           | 10 +--
 .../controllers/websocket_controller.py       | 41 ++++--------
 .../utils/conversation_utils.py               | 11 +++-
 .../workers/conversation_jobs.py              | 40 ++----------
 .../workers/orchestrator/health_monitor.py    | 64 ++++++++++++++++---
 .../workers/orchestrator/process_manager.py   | 35 ++++++++--
 tests/endpoints/audio_upload_tests.robot      | 20 ++++--
 tests/integration/plugin_event_tests.robot    | 12 ++--
 .../websocket_transcription_e2e_test.robot    | 21 ++++++
 tests/resources/audio_keywords.robot          | 16 ++++-
 tests/resources/conversation_keywords.robot   |  2 +-
 12 files changed, 192 insertions(+), 95 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index a2321d58..223564d2 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -237,7 +237,7 @@ async def upload_and_process_audio_files(
         successful_files = [f for f in processed_files if f.get("status") == "started"]
         failed_files = [f for f in processed_files if f.get("status") == "error"]
 
-        return {
+        response_body = {
             "message": f"Uploaded and processing {len(successful_files)} file(s)",
             "client_id": client_id,
             "files": processed_files,
@@ -248,6 +248,19 @@ async def upload_and_process_audio_files(
             },
         }
 
+        # Return appropriate HTTP status code based on results
+        if len(failed_files) == len(files):
+            # ALL files failed - return 400 Bad Request
+            audio_logger.error(f"All {len(files)} file(s) failed to upload")
+            return JSONResponse(status_code=400, content=response_body)
+        elif len(failed_files) > 0:
+            # SOME files failed (partial success) - return 207 Multi-Status
+            audio_logger.warning(f"Partial upload: {len(successful_files)} succeeded, {len(failed_files)} failed")
+            return JSONResponse(status_code=207, content=response_body)
+        else:
+            # All files succeeded - return 200 OK
+            return response_body
+
     except (OSError, IOError) as e:
         # File system errors during upload handling
         audio_logger.exception("File I/O error in upload_and_process_audio_files")
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
index 17a4899d..0ea739d4 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
@@ -415,7 +415,8 @@ def start_post_conversation_jobs(
     user_id: str,
     transcript_version_id: Optional[str] = None,
     depends_on_job = None,
-    client_id: Optional[str] = None
+    client_id: Optional[str] = None,
+    end_reason: str = "file_upload"
 ) -> Dict[str, str]:
     """
     Start post-conversation processing jobs after conversation is created.
@@ -435,6 +436,7 @@ def start_post_conversation_jobs(
         transcript_version_id: Transcript version ID (auto-generated if None)
         depends_on_job: Optional job dependency for first job (e.g., transcription for file uploads)
         client_id: Client ID for UI tracking
+        end_reason: Reason conversation ended (e.g., 'file_upload', 'websocket_disconnect', 'user_stopped')
 
     Returns:
         Dict with job IDs for speaker_recognition, memory, title_summary, event_dispatch
@@ -537,18 +539,18 @@ def start_post_conversation_jobs(
         conversation_id,
         client_id or "",
         user_id,
-        "file_upload",  # Explicit end_reason for file upload processing
+        end_reason,  # Use the end_reason parameter (defaults to 'file_upload' for backward compatibility)
         job_timeout=120,  # 2 minutes
         result_ttl=JOB_RESULT_TTL,
         depends_on=[memory_job, title_summary_job],  # Wait for both parallel jobs
         job_id=event_job_id,
-        description=f"Dispatch conversation complete event for {conversation_id[:8]}",
+        description=f"Dispatch conversation complete event ({end_reason}) for {conversation_id[:8]}",
         meta=job_meta
     )
     logger.info(f"📥 RQ: Enqueued conversation complete event job {event_dispatch_job.id}, meta={event_dispatch_job.meta} (depends on {memory_job.id} and {title_summary_job.id})")
 
     return {
-        'speaker_recognition': speaker_job.id,
+        'speaker_recognition': speaker_job.id if speaker_job else None,
         'memory': memory_job.id,
         'title_summary': title_summary_job.id,
         'event_dispatch': event_dispatch_job.id
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
index fa5b23b2..8cd3319b 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/websocket_controller.py
@@ -202,35 +202,22 @@ async def create_client_state(client_id: str, user, device_name: Optional[str] =
 
 
 async def cleanup_client_state(client_id: str):
-    """Clean up and remove client state, including cancelling speech detection job and marking session complete."""
-    # Cancel the speech detection job for this client
-    from advanced_omi_backend.controllers.queue_controller import redis_conn
-    from rq.job import Job
+    """
+    Clean up and remove client state, marking session complete.
+
+    Note: We do NOT cancel the speech detection job here because:
+    1. The job needs to process all audio data that was already sent
+    2. If speech was detected, it should create a conversation
+    3. The job will complete naturally when it sees session status = "finalizing"
+    4. The job has a grace period (15s) to wait for final transcription
+    5. RQ's job_timeout (24h) prevents jobs from hanging forever
+    """
+    # Note: Previously we cancelled the speech detection job here, but this prevented
+    # conversations from being created when WebSocket disconnects mid-recording.
+    # The speech detection job now monitors session status and completes naturally.
     import redis.asyncio as redis
 
-    try:
-        job_id_key = f"speech_detection_job:{client_id}"
-        job_id_bytes = redis_conn.get(job_id_key)
-
-        if job_id_bytes:
-            job_id = job_id_bytes.decode()
-            logger.info(f"🛑 Cancelling speech detection job {job_id} for client {client_id}")
-
-            try:
-                # Fetch and cancel the job
-                job = Job.fetch(job_id, connection=redis_conn)
-                job.cancel()
-                logger.info(f"✅ Successfully cancelled speech detection job {job_id}")
-            except Exception as job_error:
-                logger.warning(f"⚠️ Failed to cancel job {job_id}: {job_error}")
-
-            # Clean up the tracking key
-            redis_conn.delete(job_id_key)
-            logger.info(f"🧹 Cleaned up job tracking key for client {client_id}")
-        else:
-            logger.debug(f"No speech detection job found for client {client_id}")
-    except Exception as e:
-        logger.warning(f"⚠️ Error during job cancellation for client {client_id}: {e}")
+    logger.info(f"🔄 Letting speech detection job complete naturally for client {client_id} (if running)")
 
     # Mark all active sessions for this client as complete AND delete Redis streams
     try:
diff --git a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
index 03f75dc3..27af4bfa 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/conversation_utils.py
@@ -525,6 +525,15 @@ async def update_job_progress_metadata(
     if "created_at" not in current_job.meta:
         current_job.meta["created_at"] = datetime.now().isoformat()
 
+    # Calculate inactivity based on audio-relative timestamps
+    # Both current_audio_time and last_meaningful_speech_time are seconds into the audio stream
+    current_audio_time = speech_analysis.get("speech_end", 0.0)
+    inactivity_seconds = (
+        current_audio_time - last_meaningful_speech_time
+        if current_audio_time > 0 and last_meaningful_speech_time > 0
+        else 0
+    )
+
     current_job.meta.update(
         {
             "conversation_id": conversation_id,
@@ -538,7 +547,7 @@ async def update_job_progress_metadata(
             "duration_seconds": speech_analysis.get("duration", 0),
             "has_speech": speech_analysis.get("has_speech", False),
             "last_update": datetime.now().isoformat(),
-            "inactivity_seconds": time.time() - last_meaningful_speech_time,
+            "inactivity_seconds": inactivity_seconds,
             "chunks_processed": combined["chunk_count"],
         }
     )
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index 26b820a6..beaabbef 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -674,7 +674,8 @@ async def open_conversation_job(
         conversation_id=conversation_id,
         user_id=user_id,
         transcript_version_id=version_id,  # Pass the streaming transcript version ID
-        client_id=client_id  # Pass client_id for UI tracking
+        client_id=client_id,  # Pass client_id for UI tracking
+        end_reason=end_reason  # Pass the determined end_reason (websocket_disconnect, inactivity_timeout, etc.)
     )
 
     logger.info(
@@ -686,38 +687,11 @@ async def open_conversation_job(
     # Wait a moment to ensure jobs are registered in RQ
     await asyncio.sleep(0.5)
 
-    # Enqueue conversation.complete event dispatch job
-    # This unifies the dispatch path for both WebSocket and file upload processing
-    try:
-        from rq import Queue
-
-        default_queue = Queue('default', connection=redis_conn)
-
-        dispatch_job = default_queue.enqueue(
-            dispatch_conversation_complete_event_job,
-            conversation_id,
-            client_id,
-            user_id,
-            end_reason,  # Pass the end_reason we determined earlier
-            job_timeout=120,
-            result_ttl=600,
-            job_id=f"event_complete_{conversation_id[:12]}",
-            description=f"Dispatch conversation complete event ({end_reason})",
-            meta={"client_id": client_id}
-        )
-
-        logger.info(
-            f"📥 Enqueued conversation.complete dispatch job {dispatch_job.id} "
-            f"for {conversation_id[:12]} (end_reason={end_reason})"
-        )
-
-    except Exception as e:
-        logger.error(
-            f"❌ Failed to enqueue conversation.complete dispatch job "
-            f"for {conversation_id[:12]}: {e}",
-            exc_info=True
-        )
-        # Don't fail the entire job - conversation is saved, just plugins won't be notified
+    # Note: conversation.complete event dispatch job is already enqueued by start_post_conversation_jobs
+    # It runs after memory and title/summary jobs complete, ensuring all data is ready
+    logger.info(
+        f"✅ Post-conversation pipeline started with event dispatch job (end_reason={end_reason})"
+    )
 
     # Call shared cleanup/restart logic
     return await handle_end_of_conversation(
diff --git a/backends/advanced/src/advanced_omi_backend/workers/orchestrator/health_monitor.py b/backends/advanced/src/advanced_omi_backend/workers/orchestrator/health_monitor.py
index 9b1149e2..310999c6 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/orchestrator/health_monitor.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/orchestrator/health_monitor.py
@@ -236,7 +236,7 @@ def _handle_registration_loss(self):
             "(replicating old start-workers.sh behavior)"
         )
 
-        # Restart all RQ workers
+        # Restart all RQ workers (this method now handles timestamp update internally)
         success = self._restart_all_rq_workers()
 
         if success:
@@ -244,12 +244,9 @@ def _handle_registration_loss(self):
         else:
             logger.error("❌ Bulk restart encountered errors - check individual worker logs")
 
-        # Update recovery timestamp to start cooldown
-        self.last_registration_recovery = current_time
-
     def _restart_all_rq_workers(self) -> bool:
         """
-        Restart all RQ workers (bulk restart).
+        Restart all RQ workers (bulk restart) with timing measurements.
 
         This matches the old bash script's recovery mechanism:
         - Kill all RQ workers
@@ -269,19 +266,66 @@ def _restart_all_rq_workers(self) -> bool:
             logger.warning("No RQ workers found to restart")
             return False
 
-        logger.info(f"Restarting {len(rq_workers)} RQ workers...")
+        # START TIMING
+        bulk_restart_start = time.time()
+        logger.warning(
+            f"⚠️  RQ worker registration lost! "
+            f"Starting bulk restart of {len(rq_workers)} workers at {time.strftime('%H:%M:%S')}"
+        )
 
         all_success = True
-        for worker in rq_workers:
-            logger.info(f"  ↻ Restarting {worker.name}...")
+        worker_times = []  # Track individual worker restart times
+
+        for i, worker in enumerate(rq_workers, 1):
+            worker_start = time.time()
+            logger.info(
+                f"  [{i}/{len(rq_workers)}] ↻ Restarting {worker.name} at {time.strftime('%H:%M:%S')}..."
+            )
+
             success = self.process_manager.restart_worker(worker.name)
 
+            worker_duration = time.time() - worker_start
+            worker_times.append((worker.name, worker_duration))
+
             if success:
-                logger.info(f"  ✓ {worker.name} restarted successfully")
+                logger.info(
+                    f"  [{i}/{len(rq_workers)}] ✓ {worker.name} restarted in {worker_duration:.2f}s"
+                )
             else:
-                logger.error(f"  ✗ {worker.name} restart failed")
+                logger.error(
+                    f"  [{i}/{len(rq_workers)}] ✗ {worker.name} restart failed after {worker_duration:.2f}s"
+                )
                 all_success = False
 
+        # END TIMING
+        total_duration = time.time() - bulk_restart_start
+
+        # Log timing summary
+        logger.info(f"\n⏱️  Bulk Restart Timing Summary:")
+        logger.info(f"  Total workers: {len(rq_workers)}")
+        logger.info(
+            f"  Total time: {total_duration:.2f}s ({total_duration/60:.1f} minutes)"
+        )
+        logger.info(f"  Average per worker: {total_duration/len(rq_workers):.2f}s")
+
+        if worker_times:
+            slowest = max(worker_times, key=lambda x: x[1])
+            fastest = min(worker_times, key=lambda x: x[1])
+            logger.info(f"  Slowest worker: {slowest[0]} ({slowest[1]:.2f}s)")
+            logger.info(f"  Fastest worker: {fastest[0]} ({fastest[1]:.2f}s)")
+
+        # Update recovery timestamp (moved here from _handle_registration_loss)
+        self.last_registration_recovery = time.time()
+
+        if all_success:
+            logger.info(
+                f"✅ Successfully restarted all {len(rq_workers)} RQ workers in {total_duration:.2f}s"
+            )
+        else:
+            logger.warning(
+                f"⚠️  Some workers failed to restart (took {total_duration:.2f}s total)"
+            )
+
         return all_success
 
     def get_health_status(self) -> dict:
diff --git a/backends/advanced/src/advanced_omi_backend/workers/orchestrator/process_manager.py b/backends/advanced/src/advanced_omi_backend/workers/orchestrator/process_manager.py
index 21b7f23e..5448b96f 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/orchestrator/process_manager.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/orchestrator/process_manager.py
@@ -240,7 +240,7 @@ def stop_all(self, timeout: int = 30) -> bool:
 
     def restart_worker(self, name: str, timeout: int = 30) -> bool:
         """
-        Restart a specific worker.
+        Restart a specific worker with timing measurements.
 
         Args:
             name: Worker name
@@ -254,23 +254,44 @@ def restart_worker(self, name: str, timeout: int = 30) -> bool:
             logger.error(f"Worker '{name}' not found")
             return False
 
-        logger.info(f"Restarting worker: {name}")
+        restart_start = time.time()
+        logger.info(f"{name}: Starting restart at {time.strftime('%H:%M:%S')}")
 
-        # Ensure worker is fully stopped before attempting restart
+        # STOP phase with timing
+        stop_start = time.time()
         stop_success = worker.stop(timeout=timeout)
+        stop_duration = time.time() - stop_start
+
         if not stop_success:
-            logger.error(f"{name}: Failed to stop cleanly, restart aborted")
+            logger.error(
+                f"{name}: Failed to stop cleanly after {stop_duration:.2f}s "
+                f"(timeout was {timeout}s), restart aborted"
+            )
             worker.state = WorkerState.FAILED
             return False
 
-        # Attempt to start the worker
+        logger.info(
+            f"{name}: Stopped in {stop_duration:.2f}s (timeout was {timeout}s)"
+        )
+
+        # START phase with timing
+        start_start = time.time()
         success = worker.start()
+        start_duration = time.time() - start_start
+
+        total_restart_time = time.time() - restart_start
 
         if success:
             worker.restart_count += 1
-            logger.info(f"{name}: Restart #{worker.restart_count} successful")
+            logger.info(
+                f"{name}: Restart #{worker.restart_count} successful "
+                f"(stop: {stop_duration:.2f}s, start: {start_duration:.2f}s, total: {total_restart_time:.2f}s)"
+            )
         else:
-            logger.error(f"{name}: Restart failed")
+            logger.error(
+                f"{name}: Restart failed after {total_restart_time:.2f}s "
+                f"(stop: {stop_duration:.2f}s, start attempt: {start_duration:.2f}s)"
+            )
 
         return success
 
diff --git a/tests/endpoints/audio_upload_tests.robot b/tests/endpoints/audio_upload_tests.robot
index 7290f150..c4e8fc21 100644
--- a/tests/endpoints/audio_upload_tests.robot
+++ b/tests/endpoints/audio_upload_tests.robot
@@ -188,17 +188,27 @@ Audio Upload Client ID Generation Test
     Should Contain    ${client_id1}    ${device_name}    msg=Client ID should contain device name
     Should Match Regexp    ${client_id1}    ^[a-f0-9]{6}-${device_name}$    msg=Client ID should match format
 
-    # Verify conversation_id is in all job metadata (transcription, speaker, memory jobs)
+    # Verify conversation_id is in job metadata for all created jobs
+    # Note: Speaker job is only created if speaker recognition is enabled in config
+
+    # 1. Transcription job (always created)
     ${transcribe_job}=    Get Job Details    transcribe_${conversation_id1[:12]}
     ${transcribe_meta}=    Set Variable    ${transcribe_job}[meta]
     Dictionary Should Contain Key    ${transcribe_meta}    conversation_id    msg=Transcription job should have conversation_id in meta
     Should Be Equal    ${transcribe_meta}[conversation_id]    ${conversation_id1}    msg=Transcription job meta conversation_id should match
 
+    # 2. Speaker job (conditional - only if speaker recognition enabled)
     ${speaker_job}=    Get Job Details    speaker_${conversation_id1[:12]}
-    ${speaker_meta}=    Set Variable    ${speaker_job}[meta]
-    Dictionary Should Contain Key    ${speaker_meta}    conversation_id    msg=Speaker job should have conversation_id in meta
-    Should Be Equal    ${speaker_meta}[conversation_id]    ${conversation_id1}    msg=Speaker job meta conversation_id should match
+    IF    ${speaker_job} != ${None}
+        ${speaker_meta}=    Set Variable    ${speaker_job}[meta]
+        Dictionary Should Contain Key    ${speaker_meta}    conversation_id    msg=Speaker job should have conversation_id in meta
+        Should Be Equal    ${speaker_meta}[conversation_id]    ${conversation_id1}    msg=Speaker job meta conversation_id should match
+        Log To Console    ✅ Speaker job metadata verified
+    ELSE
+        Log To Console    Speaker recognition disabled - skipping speaker job check
+    END
 
+    # 3. Memory job (always created if memory extraction enabled)
     ${memory_job}=    Get Job Details    memory_${conversation_id1[:12]}
     ${memory_meta}=    Set Variable    ${memory_job}[meta]
     Dictionary Should Contain Key    ${memory_meta}    conversation_id    msg=Memory job should have conversation_id in meta
@@ -213,7 +223,7 @@ Audio Upload Client ID Generation Test
 
     Log To Console    ✅ Client ID generation verified
     Log To Console    🆔 Client ID: ${client_id1}
-    Log To Console    ✅ conversation_id in job metadata verified
+    Log To Console    ✅ conversation_id in job metadata verified (transcription + memory jobs)
 
 
 Audio Upload Job Tracking Test
diff --git a/tests/integration/plugin_event_tests.robot b/tests/integration/plugin_event_tests.robot
index f78649ad..35dd77ef 100644
--- a/tests/integration/plugin_event_tests.robot
+++ b/tests/integration/plugin_event_tests.robot
@@ -164,8 +164,9 @@ WebSocket Disconnect Should Trigger Conversation Complete Event
     ${total_chunks}=    Close Audio Stream Without Stop Event    ${stream_id}
     Log    Closed WebSocket stream abruptly, sent ${total_chunks} total chunks
 
-    # Wait for plugin event dispatch (polls every 2s, max 10s)
-    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=10s
+    # Wait for plugin event dispatch (polls every 2s, max 30s)
+    # Event dispatch depends on memory and title/summary jobs completing (~20-25s total)
+    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=30s
 
     Should Be True    ${new_events} > 0
     ...    msg=At least one conversation.complete event should be logged
@@ -174,9 +175,12 @@ WebSocket Disconnect Should Trigger Conversation Complete Event
     Verify Event Metadata    conversation.complete    end_reason    websocket_disconnect    ${conversation_id}
 
     # Verify conversation has end_reason set in database
+    # Wait for end_reason to be persisted (open_conversation_job saves it at the end)
+    Wait Until Keyword Succeeds    10s    1s
+    ...    Conversation Should Have End Reason    ${conversation_id}    websocket_disconnect
+
+    # Verify completed_at timestamp is set
     ${updated_conversation}=    Get Conversation By ID    ${conversation_id}
-    Should Be Equal    ${updated_conversation}[end_reason]    websocket_disconnect
-    ...    msg=Conversation should have websocket_disconnect end_reason
     Should Not Be Equal    ${updated_conversation}[completed_at]    ${None}
     ...    msg=Conversation should have completed_at timestamp
 
diff --git a/tests/integration/websocket_transcription_e2e_test.robot b/tests/integration/websocket_transcription_e2e_test.robot
index d45cec26..7b29a06d 100644
--- a/tests/integration/websocket_transcription_e2e_test.robot
+++ b/tests/integration/websocket_transcription_e2e_test.robot
@@ -123,6 +123,27 @@ Conversation Created With Valid Transcript
     Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
     Close Audio Stream    ${stream_id}
 
+    # DIAGNOSTIC: Verify speech detection job completes before checking for conversation
+    Log    Waiting for speech detection job to complete...
+    ${speech_jobs}=    Wait Until Keyword Succeeds    30s    3s
+    ...    Get Jobs By Type And Client    speech_detection    ${client_id}
+
+    Should Not Be Empty    ${speech_jobs}    No speech detection job found
+    ${speech_job}=    Set Variable    ${speech_jobs}[0]
+    ${speech_job_id}=    Set Variable    ${speech_job}[job_id]
+
+    # Wait for speech detection to finish
+    Wait For Job Status    ${speech_job_id}    finished    timeout=30s    interval=2s
+
+    # Verify speech was detected (not no_speech_detected)
+    ${speech_result}=    Get Job Result    ${speech_job_id}
+    Should Not Contain    ${speech_result}    no_speech_detected
+    ...    Speech detection failed with no_speech_detected - transcript may be empty or insufficient
+    Should Contain    ${speech_result}    conversation_job_id
+    ...    Speech detection did not create conversation_job_id
+
+    Log    ✅ Speech detection completed successfully, conversation job should exist
+
     # Wait for conversation to be created
     ${conv_jobs}=    Wait Until Keyword Succeeds    60s    3s
     ...    Job Type Exists For Client    open_conversation    ${client_id}
diff --git a/tests/resources/audio_keywords.robot b/tests/resources/audio_keywords.robot
index 2baf48e9..d2b8ac81 100644
--- a/tests/resources/audio_keywords.robot
+++ b/tests/resources/audio_keywords.robot
@@ -43,9 +43,21 @@ Upload Audio File
       ${upload_response}=    Set Variable    ${response.json()}
       Log    Parsed upload response: ${upload_response}
 
-      # Validate upload was successful
+      # Check HTTP status code first - fail immediately with clear error message
+      IF    ${response.status_code} == 400
+          ${error_msg}=    Set Variable    ${upload_response['files'][0]['error']}
+          Fail    Upload failed (HTTP 400): All files failed - ${error_msg}
+      END
+
+      IF    ${response.status_code} == 207
+          ${error_msg}=    Set Variable    Partial upload failure - check logs
+          Log    WARN: Partial upload (HTTP 207): ${upload_response['summary']['failed']} of ${upload_response['summary']['total']} files failed
+          # Continue anyway since some files succeeded
+      END
+
+      # Validate upload was successful (should be 200 or 207 at this point)
       Should Be Equal As Strings    ${upload_response['summary']['started']}    1    Upload failed: No files enqueued
-      Should Be Equal As Strings    ${upload_response['files'][0]['status']}    started    Upload failed: ${response.text}
+      Should Be Equal As Strings    ${upload_response['files'][0]['status']}    started    Upload failed: ${upload_response['files'][0].get('error', 'Unknown error')}
 
       # Extract important values
       ${job_id}=        Set Variable    ${upload_response['files'][0]['conversation_id']}
diff --git a/tests/resources/conversation_keywords.robot b/tests/resources/conversation_keywords.robot
index 26d80739..5aea9aee 100644
--- a/tests/resources/conversation_keywords.robot
+++ b/tests/resources/conversation_keywords.robot
@@ -19,7 +19,7 @@ Get User Conversations
 Get Conversation By ID
     [Documentation]    Get a specific conversation by ID
     [Arguments]       ${conversation_id}
-    ${response}=    GET On Session    api    /api/conversations/${conversation_id} 
+    ${response}=    GET On Session    api    /api/conversations/${conversation_id}
     RETURN    ${response.json()}[conversation]
 
 Get Conversation Versions

From f08fbc422f16697bea0892a5903a617a543a7871 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Thu, 22 Jan 2026 17:08:45 +0000
Subject: [PATCH 08/14] Refactor audio processing and job handling to improve
 transcription management

- Updated `upload_and_process_audio_files` to check for transcription provider availability before enqueueing jobs, enhancing error handling and logging.
- Modified `start_post_conversation_jobs` to conditionally enqueue memory extraction jobs based on configuration, improving flexibility in job management.
- Enhanced event dispatch job dependencies to only include jobs that were actually enqueued, ensuring accurate job tracking.
- Added `is_transcription_available` function to check transcription provider status, improving modularity and clarity in the transcription workflow.
---
 .../controllers/audio_controller.py           | 66 ++++++++++-------
 .../controllers/queue_controller.py           | 71 ++++++++++++-------
 .../services/transcription/__init__.py        | 14 ++++
 tests/Makefile                                | 28 +++++++-
 4 files changed, 128 insertions(+), 51 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
index 223564d2..734df6ed 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/audio_controller.py
@@ -14,13 +14,22 @@
 from fastapi import UploadFile
 from fastapi.responses import JSONResponse
 
+from advanced_omi_backend.controllers.queue_controller import (
+    JOB_RESULT_TTL,
+    start_post_conversation_jobs,
+    transcription_queue,
+)
 from advanced_omi_backend.models.conversation import create_conversation
 from advanced_omi_backend.models.user import User
+from advanced_omi_backend.services.transcription import is_transcription_available
 from advanced_omi_backend.utils.audio_chunk_utils import convert_audio_to_chunks
 from advanced_omi_backend.utils.audio_utils import (
     AudioValidationError,
     validate_and_prepare_audio,
 )
+from advanced_omi_backend.workers.transcription_jobs import (
+    transcribe_full_audio_job,
+)
 
 logger = logging.getLogger(__name__)
 audio_logger = logging.getLogger("audio_processing")
@@ -167,38 +176,36 @@ async def upload_and_process_audio_files(
                     continue
 
                 # Enqueue batch transcription job first (file uploads need transcription)
-                from advanced_omi_backend.controllers.queue_controller import (
-                    JOB_RESULT_TTL,
-                    start_post_conversation_jobs,
-                    transcription_queue,
-                )
-                from advanced_omi_backend.workers.transcription_jobs import (
-                    transcribe_full_audio_job,
-                )
-
                 version_id = str(uuid.uuid4())
                 transcribe_job_id = f"transcribe_{conversation_id[:12]}"
 
-                transcription_job = transcription_queue.enqueue(
-                    transcribe_full_audio_job,
-                    conversation_id,
-                    version_id,
-                    "batch",  # trigger
-                    job_timeout=1800,  # 30 minutes
-                    result_ttl=JOB_RESULT_TTL,
-                    job_id=transcribe_job_id,
-                    description=f"Transcribe uploaded file {conversation_id[:8]}",
-                    meta={'conversation_id': conversation_id, 'client_id': client_id}
-                )
-
-                audio_logger.info(f"📥 Enqueued transcription job {transcription_job.id} for uploaded file")
+                # Check if transcription provider is available before enqueueing
+                transcription_job = None
+                if is_transcription_available(mode="batch"):
+                    transcription_job = transcription_queue.enqueue(
+                        transcribe_full_audio_job,
+                        conversation_id,
+                        version_id,
+                        "batch",  # trigger
+                        job_timeout=1800,  # 30 minutes
+                        result_ttl=JOB_RESULT_TTL,
+                        job_id=transcribe_job_id,
+                        description=f"Transcribe uploaded file {conversation_id[:8]}",
+                        meta={'conversation_id': conversation_id, 'client_id': client_id}
+                    )
+                    audio_logger.info(f"📥 Enqueued transcription job {transcription_job.id} for uploaded file")
+                else:
+                    audio_logger.warning(
+                        f"⚠️ Skipping transcription for conversation {conversation_id}: "
+                        "No transcription provider configured"
+                    )
 
                 # Enqueue post-conversation processing job chain (depends on transcription)
                 job_ids = start_post_conversation_jobs(
                     conversation_id=conversation_id,
                     user_id=user.user_id,
                     transcript_version_id=version_id,  # Pass the version_id from transcription job
-                    depends_on_job=transcription_job,  # Wait for transcription to complete
+                    depends_on_job=transcription_job,  # Wait for transcription to complete (or None)
                     client_id=client_id  # Pass client_id for UI tracking
                 )
 
@@ -206,15 +213,24 @@ async def upload_and_process_audio_files(
                     "filename": file.filename,
                     "status": "started",  # RQ standard: job has been enqueued
                     "conversation_id": conversation_id,
-                    "transcript_job_id": transcription_job.id,
+                    "transcript_job_id": transcription_job.id if transcription_job else None,
                     "speaker_job_id": job_ids['speaker_recognition'],
                     "memory_job_id": job_ids['memory'],
                     "duration_seconds": round(duration, 2),
                 })
 
+                # Build job chain description
+                job_chain = []
+                if transcription_job:
+                    job_chain.append(transcription_job.id)
+                if job_ids['speaker_recognition']:
+                    job_chain.append(job_ids['speaker_recognition'])
+                if job_ids['memory']:
+                    job_chain.append(job_ids['memory'])
+
                 audio_logger.info(
                     f"✅ Processed {file.filename} → conversation {conversation_id}, "
-                    f"jobs: {transcription_job.id} → {job_ids['speaker_recognition']} → {job_ids['memory']}"
+                    f"jobs: {' → '.join(job_chain) if job_chain else 'none'}"
                 )
 
             except (OSError, IOError) as e:
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
index 0ea739d4..70b9b336 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/queue_controller.py
@@ -483,27 +483,35 @@ def start_post_conversation_jobs(
     else:
         logger.info(f"⏭️  Speaker recognition disabled, skipping speaker job for conversation {conversation_id[:8]}")
 
-    # Step 2: Memory extraction job
-    # Depends on speaker job if it was created, otherwise depends on upstream (transcription or nothing)
-    memory_job_id = f"memory_{conversation_id[:12]}"
-    logger.info(f"🔍 DEBUG: Creating memory job with job_id={memory_job_id}, conversation_id={conversation_id[:12]}")
-
-    memory_job = memory_queue.enqueue(
-        process_memory_job,
-        conversation_id,
-        job_timeout=900,  # 15 minutes
-        result_ttl=JOB_RESULT_TTL,
-        depends_on=speaker_dependency,  # Either speaker_job or upstream dependency
-        job_id=memory_job_id,
-        description=f"Memory extraction for conversation {conversation_id[:8]}",
-        meta=job_meta
-    )
-    if speaker_job:
-        logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (depends on speaker job {speaker_job.id})")
-    elif depends_on_job:
-        logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (depends on {depends_on_job.id})")
+    # Step 2: Memory extraction job (conditional - only if enabled)
+    # Check if memory extraction is enabled
+    memory_config = get_service_config('memory.extraction')
+    memory_enabled = memory_config.get('enabled', True)  # Default to True for backward compatibility
+
+    memory_job = None
+    if memory_enabled:
+        # Depends on speaker job if it was created, otherwise depends on upstream (transcription or nothing)
+        memory_job_id = f"memory_{conversation_id[:12]}"
+        logger.info(f"🔍 DEBUG: Creating memory job with job_id={memory_job_id}, conversation_id={conversation_id[:12]}")
+
+        memory_job = memory_queue.enqueue(
+            process_memory_job,
+            conversation_id,
+            job_timeout=900,  # 15 minutes
+            result_ttl=JOB_RESULT_TTL,
+            depends_on=speaker_dependency,  # Either speaker_job or upstream dependency
+            job_id=memory_job_id,
+            description=f"Memory extraction for conversation {conversation_id[:8]}",
+            meta=job_meta
+        )
+        if speaker_job:
+            logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (depends on speaker job {speaker_job.id})")
+        elif depends_on_job:
+            logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (depends on {depends_on_job.id})")
+        else:
+            logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (no dependencies, starts immediately)")
     else:
-        logger.info(f"📥 RQ: Enqueued memory extraction job {memory_job.id}, meta={memory_job.meta} (no dependencies, starts immediately)")
+        logger.info(f"⏭️  Memory extraction disabled, skipping memory job for conversation {conversation_id[:8]}")
 
     # Step 3: Title/summary generation job
     # Depends on speaker job if enabled, otherwise on upstream dependency
@@ -532,8 +540,15 @@ def start_post_conversation_jobs(
     event_job_id = f"event_complete_{conversation_id[:12]}"
     logger.info(f"🔍 DEBUG: Creating conversation complete event job with job_id={event_job_id}, conversation_id={conversation_id[:12]}")
 
-    # Event job depends on both memory and title/summary jobs completing
-    # Use RQ's depends_on list to wait for both
+    # Event job depends on memory and title/summary jobs that were actually enqueued
+    # Build dependency list excluding None values
+    event_dependencies = []
+    if memory_job:
+        event_dependencies.append(memory_job)
+    if title_summary_job:
+        event_dependencies.append(title_summary_job)
+
+    # Enqueue event dispatch job (may have no dependencies if all jobs were skipped)
     event_dispatch_job = default_queue.enqueue(
         dispatch_conversation_complete_event_job,
         conversation_id,
@@ -542,16 +557,22 @@ def start_post_conversation_jobs(
         end_reason,  # Use the end_reason parameter (defaults to 'file_upload' for backward compatibility)
         job_timeout=120,  # 2 minutes
         result_ttl=JOB_RESULT_TTL,
-        depends_on=[memory_job, title_summary_job],  # Wait for both parallel jobs
+        depends_on=event_dependencies if event_dependencies else None,  # Wait for jobs that were enqueued
         job_id=event_job_id,
         description=f"Dispatch conversation complete event ({end_reason}) for {conversation_id[:8]}",
         meta=job_meta
     )
-    logger.info(f"📥 RQ: Enqueued conversation complete event job {event_dispatch_job.id}, meta={event_dispatch_job.meta} (depends on {memory_job.id} and {title_summary_job.id})")
+
+    # Log event dispatch dependencies
+    if event_dependencies:
+        dep_ids = [job.id for job in event_dependencies]
+        logger.info(f"📥 RQ: Enqueued conversation complete event job {event_dispatch_job.id}, meta={event_dispatch_job.meta} (depends on {', '.join(dep_ids)})")
+    else:
+        logger.info(f"📥 RQ: Enqueued conversation complete event job {event_dispatch_job.id}, meta={event_dispatch_job.meta} (no dependencies, starts immediately)")
 
     return {
         'speaker_recognition': speaker_job.id if speaker_job else None,
-        'memory': memory_job.id,
+        'memory': memory_job.id if memory_job else None,
         'title_summary': title_summary_job.id,
         'event_dispatch': event_dispatch_job.id
     }
diff --git a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
index 45773432..242deb8d 100644
--- a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
+++ b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
@@ -393,8 +393,22 @@ def get_transcription_provider(provider_name: Optional[str] = None, mode: Option
     return RegistryBatchTranscriptionProvider()
 
 
+def is_transcription_available(mode: str = "batch") -> bool:
+    """Check if transcription provider is available for given mode.
+
+    Args:
+        mode: Either "batch" or "streaming"
+
+    Returns:
+        True if a transcription provider is configured and available, False otherwise
+    """
+    provider = get_transcription_provider(mode=mode)
+    return provider is not None
+
+
 __all__ = [
     "get_transcription_provider",
+    "is_transcription_available",
     "RegistryBatchTranscriptionProvider",
     "RegistryStreamingTranscriptionProvider",
     "BaseTranscriptionProvider",
diff --git a/tests/Makefile b/tests/Makefile
index feff61a2..34fce4a2 100644
--- a/tests/Makefile
+++ b/tests/Makefile
@@ -5,7 +5,8 @@
         containers-start containers-stop containers-restart containers-rebuild \
         containers-start-rebuild containers-clean containers-status containers-logs \
         start stop restart rebuild start-rebuild status logs \
-        test test-quick test-slow test-sdk test-all-with-slow-and-sdk clean-all
+        test test-quick test-slow test-sdk test-all-with-slow-and-sdk clean-all \
+        results results-path results-detailed
 
 # Default output directory
 OUTPUTDIR ?= results
@@ -46,6 +47,11 @@ help:
 	@echo "  make containers-status        - Show container health"
 	@echo "  make containers-logs          - View service logs (use SERVICE=name)"
 	@echo ""
+	@echo "View Results:"
+	@echo "  make results          - Quick terminal summary (SSH-friendly)"
+	@echo "  make results-path     - Print path to HTML report for viewing"
+	@echo "  make results-detailed - Detailed terminal output with full errors"
+	@echo ""
 	@echo "Utilities:"
 	@echo "  make clean       - Remove test output files"
 	@echo "  make clean-all   - Clean results + containers (saves logs)"
@@ -193,5 +199,25 @@ test-all-with-slow-and-sdk:
 		--loglevel INFO:INFO \
 		$(TEST_DIR)
 
+# ============================================================================
+# View Test Results
+# ============================================================================
+
+# View test results in terminal (SSH-friendly)
+results:
+	@uv run --with-requirements test-requirements.txt python show_results.py
+
+# Print path to HTML report for manual viewing
+results-path:
+	@uv run --with-requirements test-requirements.txt python show_results.py --path
+
+# Detailed terminal output with full error messages
+results-detailed:
+	@uv run --with-requirements test-requirements.txt python show_results.py --detailed
+
+# ============================================================================
+# Cleanup
+# ============================================================================
+
 # Complete cleanup: test results + containers (saves logs)
 clean-all: clean containers-clean

From 62ee36dd2ecc2052340d69a636c68965c2841778 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Thu, 22 Jan 2026 17:38:57 +0000
Subject: [PATCH 09/14] Enhance integration tests for plugin events and improve
 error handling

- Updated integration tests to filter plugin events by conversation ID, ensuring accurate event tracking and reducing noise from fixture events.
- Improved error messages in event verification to include conversation ID context, enhancing clarity during test failures.
- Refactored audio upload handling to check for transcription job creation, allowing for more robust conversation polling and error reporting.
- Added new keyword to verify conversation end reasons, improving test coverage for conversation state validation.
---
 tests/integration/plugin_event_tests.robot  | 74 ++++++++++++---------
 tests/resources/audio_keywords.robot        | 22 +++++-
 tests/resources/conversation_keywords.robot | 11 +++
 tests/resources/plugin_keywords.robot       | 64 +++++++++++++++---
 tests/resources/queue_keywords.robot        | 39 ++++++++++-
 5 files changed, 162 insertions(+), 48 deletions(-)

diff --git a/tests/integration/plugin_event_tests.robot b/tests/integration/plugin_event_tests.robot
index 35dd77ef..cdb8c2ec 100644
--- a/tests/integration/plugin_event_tests.robot
+++ b/tests/integration/plugin_event_tests.robot
@@ -52,20 +52,22 @@ Upload Audio And Verify Transcript Batch Event
     # Clear any existing events
     Clear Plugin Events
 
-    # Get baseline event count
-    ${baseline_count}=    Get Plugin Event Count    transcript.batch
-
     # Upload test audio file
     File Should Exist    ${TEST_AUDIO_FILE}
     ...    msg=Test audio file should exist
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}
+    ${conversation_id}=    Set Variable    ${conversation}[conversation_id]
+
+    # Get baseline count for THIS specific conversation (should be 0 before waiting)
+    ${baseline_count}=    Set Variable    ${0}
 
     # Wait for transcription to complete (polls every 2s, max 30s)
-    ${new_events}=    Wait For Plugin Event    transcript.batch    ${baseline_count}    timeout=30s
+    # Filter by conversation_id to avoid picking up fixture conversation events
+    ${new_events}=    Wait For Plugin Event    transcript.batch    ${baseline_count}    timeout=30s    conversation_id=${conversation_id}
 
     # Verify at least one new event was received
     Should Be True    ${new_events} > 0
-    ...    msg=At least one transcript.batch event should be logged
+    ...    msg=At least one transcript.batch event should be logged for conversation ${conversation_id}
 
     # Get the events and verify structure
     ${events}=    Get Plugin Events By Type    transcript.batch
@@ -89,25 +91,26 @@ Conversation Complete Should Trigger Event
     # Clear events
     Clear Plugin Events
 
-    # Get baseline count
-    ${baseline_count}=    Get Plugin Event Count    conversation.complete
-
     # Upload audio (triggers conversation creation and completion)
     File Should Exist    ${TEST_AUDIO_FILE}
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}
+    ${conversation_id}=    Set Variable    ${conversation}[conversation_id]
+
+    # Get baseline count for THIS specific conversation (should be 0 before waiting)
+    ${baseline_count}=    Set Variable    ${0}
 
     # Wait for full pipeline: transcription → conversation (polls every 2s, max 40s)
-    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=40s
+    # Filter by conversation_id to avoid picking up fixture conversation events
+    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=40s    conversation_id=${conversation_id}
 
     Should Be True    ${new_events} > 0
-    ...    msg=At least one conversation.complete event should be logged
+    ...    msg=At least one conversation.complete event should be logged for conversation ${conversation_id}
 
     # Verify event structure
     ${events}=    Get Plugin Events By Type    conversation.complete
     Should Not Be Empty    ${events}
 
     # Verify end_reason metadata in plugin event
-    ${conversation_id}=    Set Variable    ${conversation}[conversation_id]
     Verify Event Metadata    conversation.complete    end_reason    file_upload    ${conversation_id}
 
 Memory Processing Should Trigger Event
@@ -117,18 +120,20 @@ Memory Processing Should Trigger Event
     # Clear events
     Clear Plugin Events
 
-    # Get baseline count
-    ${baseline_count}=    Get Plugin Event Count    memory.processed
-
     # Upload audio with meaningful content for memory extraction
     File Should Exist    ${TEST_AUDIO_FILE}
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}
+    ${conversation_id}=    Set Variable    ${conversation}[conversation_id]
+
+    # Get baseline count for THIS specific conversation (should be 0 before waiting)
+    ${baseline_count}=    Set Variable    ${0}
 
     # Wait for full pipeline: transcription → conversation → memory (polls every 2s, max 60s)
-    ${new_events}=    Wait For Plugin Event    memory.processed    ${baseline_count}    timeout=60s
+    # Filter by conversation_id to avoid picking up fixture conversation events
+    ${new_events}=    Wait For Plugin Event    memory.processed    ${baseline_count}    timeout=60s    conversation_id=${conversation_id}
 
     Should Be True    ${new_events} > 0
-    ...    msg=At least one memory.processed event should be logged
+    ...    msg=At least one memory.processed event should be logged for conversation ${conversation_id}
 
     # Verify event structure
     ${events}=    Get Plugin Events By Type    memory.processed
@@ -142,9 +147,6 @@ WebSocket Disconnect Should Trigger Conversation Complete Event
     # Clear events
     Clear Plugin Events
 
-    # Get baseline count
-    ${baseline_count}=    Get Plugin Event Count    conversation.complete
-
     # Open WebSocket stream
     ${stream_id}=    Open Audio Stream    device_name=plugin-test-ws
     ${client_id}=    Get Client ID From Device Name    plugin-test-ws
@@ -164,12 +166,16 @@ WebSocket Disconnect Should Trigger Conversation Complete Event
     ${total_chunks}=    Close Audio Stream Without Stop Event    ${stream_id}
     Log    Closed WebSocket stream abruptly, sent ${total_chunks} total chunks
 
+    # Get baseline count for THIS specific conversation (should be 0 before waiting)
+    ${baseline_count}=    Set Variable    ${0}
+
     # Wait for plugin event dispatch (polls every 2s, max 30s)
     # Event dispatch depends on memory and title/summary jobs completing (~20-25s total)
-    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=30s
+    # Filter by conversation_id to avoid picking up events from other conversations
+    ${new_events}=    Wait For Plugin Event    conversation.complete    ${baseline_count}    timeout=30s    conversation_id=${conversation_id}
 
     Should Be True    ${new_events} > 0
-    ...    msg=At least one conversation.complete event should be logged
+    ...    msg=At least one conversation.complete event should be logged for conversation ${conversation_id}
 
     # Verify plugin event has correct end_reason metadata
     Verify Event Metadata    conversation.complete    end_reason    websocket_disconnect    ${conversation_id}
@@ -191,31 +197,33 @@ Verify All Events Are Logged
     # Clear all events
     Clear Plugin Events
 
-    # Get baseline counts for all event types
-    ${batch_baseline}=    Get Plugin Event Count    transcript.batch
-    ${conv_baseline}=    Get Plugin Event Count    conversation.complete
-    ${mem_baseline}=    Get Plugin Event Count    memory.processed
-
     # Upload audio file (should trigger all events)
     File Should Exist    ${TEST_AUDIO_FILE}
     ${conversation}=    Upload Audio File    ${TEST_AUDIO_FILE}
+    ${conversation_id}=    Set Variable    ${conversation}[conversation_id]
+
+    # Get baseline counts for THIS specific conversation (should be 0 for each)
+    ${batch_baseline}=    Set Variable    ${0}
+    ${conv_baseline}=    Set Variable    ${0}
+    ${mem_baseline}=    Set Variable    ${0}
 
     # Wait for events in pipeline order (polls every 2s for each)
-    ${batch_new}=    Wait For Plugin Event    transcript.batch    ${batch_baseline}    timeout=30s
-    ${conv_new}=    Wait For Plugin Event    conversation.complete    ${conv_baseline}    timeout=30s
-    ${mem_new}=    Wait For Plugin Event    memory.processed    ${mem_baseline}    timeout=60s
+    # Filter by conversation_id to avoid picking up fixture conversation events
+    ${batch_new}=    Wait For Plugin Event    transcript.batch    ${batch_baseline}    timeout=30s    conversation_id=${conversation_id}
+    ${conv_new}=    Wait For Plugin Event    conversation.complete    ${conv_baseline}    timeout=30s    conversation_id=${conversation_id}
+    ${mem_new}=    Wait For Plugin Event    memory.processed    ${mem_baseline}    timeout=60s    conversation_id=${conversation_id}
 
     Should Be True    ${batch_new} > 0
-    ...    msg=transcript.batch events should be logged
+    ...    msg=transcript.batch events should be logged for conversation ${conversation_id}
 
     Should Be True    ${conv_new} > 0
-    ...    msg=conversation.complete events should be logged
+    ...    msg=conversation.complete events should be logged for conversation ${conversation_id}
 
     Should Be True    ${mem_new} > 0
-    ...    msg=memory.processed events should be logged
+    ...    msg=memory.processed events should be logged for conversation ${conversation_id}
 
     # Log summary
-    Log    Events logged - Batch: ${batch_new}, Conversation: ${conv_new}, Memory: ${mem_new}
+    Log    Events logged for conversation ${conversation_id} - Batch: ${batch_new}, Conversation: ${conv_new}, Memory: ${mem_new}
 
 *** Keywords ***
 Test Suite Setup
diff --git a/tests/resources/audio_keywords.robot b/tests/resources/audio_keywords.robot
index d2b8ac81..c752e511 100644
--- a/tests/resources/audio_keywords.robot
+++ b/tests/resources/audio_keywords.robot
@@ -65,15 +65,31 @@ Upload Audio File
       Log    Conversation ID: ${job_id}
       Log    Transcript Job ID: ${transcript_job_id}
 
-      # Wait for conversation to be created and transcribed
-      Log    Waiting for transcription to complete...
+      # Check if transcript_job_id is None (job not created)
+      ${is_none}=    Evaluate    $transcript_job_id is None or str($transcript_job_id) == 'None'
+
+      IF    ${is_none}
+          # Transcript job not created - skip job waiting and poll for conversation directly
+          Log    Transcript job ID is None - transcription job not created. Polling for conversation directly...
+
+          # Poll for conversation to appear (max 60s)
+          Wait Until Keyword Succeeds    60s    5s
+          ...    Get Conversation By ID    ${job_id}
+
+          ${conversation}=    Get Conversation By ID    ${job_id}
+          Log    Found conversation (without job tracking): ${conversation}
+          RETURN    ${conversation}
+      END
+
+      # Normal path: Wait for transcription job to complete
+      Log    Waiting for transcription job ${transcript_job_id} to complete...
 
       Wait Until Keyword Succeeds    60s    5s       Check job status   ${transcript_job_id}    finished
       ${job}=    Get Job Details    ${transcript_job_id}
 
      # Get the finished conversation
       ${conversation}=     Get Conversation By ID    ${job}[result][conversation_id]
-      Should Not Be Equal    ${conversation}    ${None}    Conversation not found after upload and started
+      Should Not Be Equal    ${conversation}    ${None}    Conversation not found after upload and processing
 
       Log    Found conversation: ${conversation}
       RETURN    ${conversation}
diff --git a/tests/resources/conversation_keywords.robot b/tests/resources/conversation_keywords.robot
index 5aea9aee..746565ee 100644
--- a/tests/resources/conversation_keywords.robot
+++ b/tests/resources/conversation_keywords.robot
@@ -167,3 +167,14 @@ Check Conversation Has End Reason
     ${end_reason}=    Set Variable    ${conversation}[end_reason]
     Should Not Be Equal As Strings    ${end_reason}    None    msg=End reason not set yet
     RETURN    ${conversation}
+
+Conversation Should Have End Reason
+    [Documentation]    Verify conversation has specific end_reason value
+    ...
+    ...    This keyword checks if the conversation's end_reason field matches the expected value.
+    [Arguments]    ${conversation_id}    ${expected_end_reason}
+
+    ${conversation}=    Get Conversation By ID    ${conversation_id}
+    ${actual_end_reason}=    Set Variable    ${conversation}[end_reason]
+    Should Be Equal As Strings    ${actual_end_reason}    ${expected_end_reason}
+    ...    msg=Expected end_reason '${expected_end_reason}', got '${actual_end_reason}'
diff --git a/tests/resources/plugin_keywords.robot b/tests/resources/plugin_keywords.robot
index 9d0a6df9..4e8d52d0 100644
--- a/tests/resources/plugin_keywords.robot
+++ b/tests/resources/plugin_keywords.robot
@@ -150,10 +150,11 @@ Wait For Plugin Event
     ...    - baseline_count: The event count before the operation started
     ...    - timeout: Maximum time to wait (default: 30s)
     ...    - retry_interval: Time between polling attempts (default: 2s)
-    [Arguments]    ${event_type}    ${baseline_count}    ${timeout}=30s    ${retry_interval}=2s
+    ...    - conversation_id: Optional conversation_id to filter events (default: empty)
+    [Arguments]    ${event_type}    ${baseline_count}    ${timeout}=30s    ${retry_interval}=2s    ${conversation_id}=${EMPTY}
 
     Wait Until Keyword Succeeds    ${timeout}    ${retry_interval}
-    ...    Plugin Event Count Should Be Greater Than    ${event_type}    ${baseline_count}
+    ...    Plugin Event Count Should Be Greater Than    ${event_type}    ${baseline_count}    ${conversation_id}
 
     # After successful wait, get the final count
     ${current_count}=    Get Plugin Event Count    ${event_type}
@@ -165,12 +166,37 @@ Plugin Event Count Should Be Greater Than
     ...
     ...    This keyword is used by Wait For Plugin Event for polling.
     ...    It will fail (causing a retry) until the condition is met.
-    [Arguments]    ${event_type}    ${baseline_count}
+    ...    Optionally filters by conversation_id if provided.
+    [Arguments]    ${event_type}    ${baseline_count}    ${conversation_id}=${EMPTY}
+
+    # Get all events of this type
+    ${events}=    Get Plugin Events By Type    ${event_type}
+
+    # If conversation_id filter specified, filter events
+    IF    '${conversation_id}' != ''
+        ${filtered_events}=    Create List
+        FOR    ${event}    IN    @{events}
+            ${event_data}=    Set Variable    ${event}[data]
+            ${event_conv_id}=    Evaluate    $event_data.get('conversation_id', '')
+            IF    '${event_conv_id}' == '${conversation_id}'
+                Append To List    ${filtered_events}    ${event}
+            END
+        END
+        ${current_count}=    Get Length    ${filtered_events}
+    ELSE
+        ${current_count}=    Get Length    ${events}
+    END
 
-    ${current_count}=    Get Plugin Event Count    ${event_type}
     ${new_events}=    Evaluate    ${current_count} - ${baseline_count}
-    Should Be True    ${new_events} > 0
-    ...    msg=Expected new ${event_type} events, but count is still ${current_count} (baseline: ${baseline_count})
+
+    # Build error message with conversation_id context if filtering
+    IF    '${conversation_id}' != ''
+        ${error_msg}=    Set Variable    Expected new ${event_type} events for conversation ${conversation_id}, but count is still ${current_count} (baseline: ${baseline_count})
+    ELSE
+        ${error_msg}=    Set Variable    Expected new ${event_type} events, but count is still ${current_count} (baseline: ${baseline_count})
+    END
+
+    Should Be True    ${new_events} > 0    msg=${error_msg}
 
     RETURN    ${new_events}
 
@@ -205,14 +231,23 @@ Verify Event Metadata
     Should Not Be Empty    ${events}
     ...    msg=No events found for event type '${event_type}'
 
+    # Collect conversation IDs for better error messages
+    ${found_conv_ids}=    Create List
+    ${found_metadata_values}=    Create List
+
     # Find matching event (optionally filtered by conversation_id)
     ${found}=    Set Variable    ${False}
     FOR    ${event}    IN    @{events}
+        # Track conversation_id for debugging
+        ${event_data}=    Set Variable    ${event}[data]
+        ${event_conv_id}=    Evaluate    $event_data.get('conversation_id', '')
+        IF    '${event_conv_id}' != ''
+            Append To List    ${found_conv_ids}    ${event_conv_id}
+        END
+
         # If conversation_id filter specified, check if this is the right conversation
         ${is_match}=    Set Variable    ${True}
         IF    '${conversation_id}' != ''
-            ${event_data}=    Set Variable    ${event}[data]
-            ${event_conv_id}=    Evaluate    $event_data.get('conversation_id', '')
             IF    '${event_conv_id}' != '${conversation_id}'
                 ${is_match}=    Set Variable    ${False}
             END
@@ -224,6 +259,7 @@ Verify Event Metadata
             Dictionary Should Contain Key    ${event_metadata}    ${metadata_key}
             ...    msg=Event metadata missing key '${metadata_key}'
             ${actual_value}=    Get From Dictionary    ${event_metadata}    ${metadata_key}
+            Append To List    ${found_metadata_values}    ${actual_value}
             IF    '${actual_value}' == '${expected_value}'
                 ${found}=    Set Variable    ${True}
                 BREAK
@@ -231,5 +267,13 @@ Verify Event Metadata
         END
     END
 
-    Should Be True    ${found}
-    ...    msg=No events found with metadata '${metadata_key}=${expected_value}' for event type '${event_type}'
+    # Build detailed error message if not found
+    IF    not ${found}
+        ${unique_conv_ids}=    Evaluate    list(set($found_conv_ids))
+        IF    '${conversation_id}' != ''
+            ${error_msg}=    Set Variable    No events found with metadata '${metadata_key}=${expected_value}' for conversation '${conversation_id}'. Found conversation IDs: ${unique_conv_ids}. Found metadata values: ${found_metadata_values}
+        ELSE
+            ${error_msg}=    Set Variable    No events found with metadata '${metadata_key}=${expected_value}' for event type '${event_type}'. Found conversation IDs: ${unique_conv_ids}. Found metadata values: ${found_metadata_values}
+        END
+        Fail    ${error_msg}
+    END
diff --git a/tests/resources/queue_keywords.robot b/tests/resources/queue_keywords.robot
index 5ba91bf0..b6678bf7 100644
--- a/tests/resources/queue_keywords.robot
+++ b/tests/resources/queue_keywords.robot
@@ -23,8 +23,16 @@ Get queue length
 
 Get Job Details
     [Documentation]    Get job details from the queue API by searching the jobs list
+    ...                Returns None if job not found
+    ...                Handles None job_id gracefully with clear error message
     [Arguments]    ${job_id}
 
+    # Check if job_id is None before attempting to query
+    ${is_none}=    Evaluate    $job_id is None or str($job_id) == 'None'
+    IF    ${is_none}
+        Fail    Cannot get job details: job_id is None. This usually means the job was not created successfully (check API response for errors).
+    END
+
     ${response}=    GET On Session    api    /api/queue/jobs
     Should Be Equal As Integers    ${response.status_code}    200
     ${jobs_data}=    Set Variable    ${response.json()}
@@ -38,17 +46,28 @@ Get Job Details
     END
 
     # If we get here, job not found - return None
+    Log    Job with ID '${job_id}' not found in queue    WARN
     RETURN    ${None}
 
 Get Job Status
     [Documentation]    Get just the status of a specific job by ID (lightweight endpoint)
+    ...                Returns None if job not found or if job_id is None
+    ...                Handles None job_id gracefully by returning None
     [Arguments]    ${job_id}
 
+    # Check if job_id is None - return None instead of failing
+    ${is_none}=    Evaluate    $job_id is None or str($job_id) == 'None'
+    IF    ${is_none}
+        Log    Job ID is None, cannot get status    WARN
+        RETURN    ${None}
+    END
+
     # Use the lightweight status endpoint - try to get the response
     ${success}=    Run Keyword And Return Status    GET On Session    api    /api/queue/jobs/${job_id}/status    expected_status=200
 
     IF    not ${success}
         # Job not found
+        Log    Job with ID '${job_id}' not found    DEBUG
         RETURN    ${None}
     END
 
@@ -60,12 +79,21 @@ Get Job Status
 Check job status
     [Documentation]    Check the status of a specific job by ID
     ...                Fails immediately if job is in 'failed' state when expecting 'finished'
+    ...                Handles None job_id gracefully with clear error message
     [Arguments]    ${job_id}    ${expected_status}
 
+    # Check if job_id is None or 'None' string before attempting to query
+    ${is_none}=    Evaluate    $job_id is None or str($job_id) == 'None'
+    IF    ${is_none}
+        Fail    Cannot check job status: job_id is None. This usually means the job was not created successfully (check API response for errors).
+    END
+
     ${job}=    Get Job status    ${job_id}
 
-    # If job is None (not found), fail explicitly
-    Should Not Be Equal    ${job}[job_id]    ${None}    Job with ID ${job_id} not found in queue
+    # If job is None (not found), fail explicitly with context
+    IF    ${job} == ${None}
+        Fail    Job with ID '${job_id}' not found in queue. The job may have expired, been flushed, or never existed.
+    END
 
     ${actual_status}=    Set Variable    ${job}[status]
     Log    Job ${job_id} status: ${actual_status} (expected: ${expected_status})
@@ -142,8 +170,15 @@ Find Job For Client
 
 Wait For Job Status
     [Documentation]    Wait for a job to reach a specific status
+    ...                Handles None job_id gracefully with clear error message
     [Arguments]    ${job_id}    ${expected_status}    ${timeout}=60s    ${interval}=5s
 
+    # Check if job_id is None before waiting (fail fast with clear message)
+    ${is_none}=    Evaluate    $job_id is None or str($job_id) == 'None'
+    IF    ${is_none}
+        Fail    Cannot wait for job status: job_id is None. This usually means the job was not created successfully (check API response for errors).
+    END
+
     Wait Until Keyword Succeeds    ${timeout}    ${interval}
     ...    Check job status    ${job_id}    ${expected_status}
 

From 64887a2d3e388f4c56e8c91fe3292e5b8337f529 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Fri, 23 Jan 2026 04:59:48 +0000
Subject: [PATCH 10/14] Enhance speaker recognition testing and audio
 processing

- Added mock speaker recognition client to facilitate testing without resource-intensive dependencies.
- Updated Docker Compose configurations to include mock speaker client for test environments.
- Refactored audio segment reconstruction to ensure precise clipping based on time boundaries.
- Improved error handling in transcription jobs and speaker recognition workflows to enhance robustness.
- Adjusted integration tests to utilize real-time pacing for audio chunk streaming, improving test accuracy.
---
 backends/advanced/docker-compose-test.yml     |   4 +
 .../services/transcription/__init__.py        |  40 +----
 .../speaker_recognition_client.py             |  29 ++++
 .../utils/audio_chunk_utils.py                |  53 +++++-
 .../workers/conversation_jobs.py              |  16 ++
 .../workers/speaker_jobs.py                   |  17 +-
 .../workers/transcription_jobs.py             |  63 +------
 .../webui/src/pages/Conversations.tsx         |  51 ++----
 .../docker-compose-test.yml                   |   8 +-
 .../api/routers/identification.py             |   8 +-
 .../websocket_transcription_e2e_test.robot    |   4 +-
 tests/mocks/__init__.py                       |   1 +
 tests/mocks/mock_speaker_client.py            | 160 ++++++++++++++++++
 tests/setup/test_manager_keywords.robot       |   2 +-
 14 files changed, 301 insertions(+), 155 deletions(-)
 create mode 100644 tests/mocks/__init__.py
 create mode 100644 tests/mocks/mock_speaker_client.py

diff --git a/backends/advanced/docker-compose-test.yml b/backends/advanced/docker-compose-test.yml
index bb2ac530..7e0ad0b6 100644
--- a/backends/advanced/docker-compose-test.yml
+++ b/backends/advanced/docker-compose-test.yml
@@ -58,6 +58,8 @@ services:
       - SPEECH_DETECTION_MIN_WORDS=5  # 5 words instead of 10
       # Wait for audio queue to drain before timing out (test mode)
       - WAIT_FOR_AUDIO_QUEUE_DRAIN=true
+      # Mock speaker recognition for tests (avoids resource-intensive ML service)
+      - USE_MOCK_SPEAKER_CLIENT=true
     depends_on:
       qdrant-test:
         condition: service_started
@@ -209,6 +211,8 @@ services:
       - SPEECH_DETECTION_MIN_WORDS=5  # 5 words instead of 10
       # Wait for audio queue to drain before timing out (test mode)
       - WAIT_FOR_AUDIO_QUEUE_DRAIN=true
+      # Mock speaker recognition for tests (avoids resource-intensive ML service)
+      - USE_MOCK_SPEAKER_CLIENT=true
     depends_on:
       chronicle-backend-test:
         condition: service_healthy
diff --git a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
index 242deb8d..4bfae311 100644
--- a/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
+++ b/backends/advanced/src/advanced_omi_backend/services/transcription/__init__.py
@@ -142,43 +142,9 @@ async def transcribe(self, audio_data: bytes, sample_rate: int, diarize: bool =
             words = _dotted_get(data, extract.get("words")) or []
             segments = _dotted_get(data, extract.get("segments")) or []
 
-            # DEBUG: Log what we extracted
-            logger.debug(f"DEBUG Registry: Extracted {len(segments)} segments from response")
-            if segments and len(segments) > 0:
-                logger.debug(f"DEBUG Registry: First segment keys: {list(segments[0].keys()) if isinstance(segments[0], dict) else 'not a dict'}")
-                logger.debug(f"DEBUG Registry: First segment: {segments[0]}")
-
-            # FIX: Normalize Deepgram segment structure
-            provider = self.model.model_provider.lower() if self.model.model_provider else ""
-            if provider == "deepgram" and segments:
-                normalized_segments = []
-                for seg in segments:
-                    # Deepgram segments may have nested structure
-                    # Extract text from either 'text' or 'transcript' or 'sentences'
-                    text_content = seg.get("text") or seg.get("transcript") or ""
-
-                    # Handle nested sentences structure
-                    if not text_content and "sentences" in seg:
-                        sentences = seg.get("sentences", [])
-                        text_content = " ".join([s.get("text", "") for s in sentences if s.get("text")])
-
-                    # Skip empty segments
-                    if not text_content or not text_content.strip():
-                        logger.debug(f"Skipping empty Deepgram segment: {seg}")
-                        continue
-
-                    # Build normalized segment
-                    normalized_seg = {
-                        "text": text_content.strip(),
-                        "start": seg.get("start", 0.0),
-                        "end": seg.get("end", 0.0),
-                        "speaker": seg.get("speaker", "SPEAKER_00"),
-                        "confidence": seg.get("confidence", 1.0)
-                    }
-                    normalized_segments.append(normalized_seg)
-
-                segments = normalized_segments
-                logger.debug(f"Normalized {len(segments)} Deepgram segments")
+            # Ignore segments from all providers - speaker service creates them via diarization
+            segments = []
+            logger.debug(f"Transcription: Extracted {len(words)} words, ignoring provider segments (speaker service will create them)")
 
         return {"text": text, "words": words, "segments": segments}
 
diff --git a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
index 8dbada0b..d58b2a5d 100644
--- a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
+++ b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
@@ -36,6 +36,29 @@ def __init__(self, service_url: Optional[str] = None):
             service_url: URL of the speaker recognition service (e.g., http://speaker-service:8085)
                         If not provided, uses config.yml service_url or SPEAKER_SERVICE_URL env var
         """
+        # Check if we should use mock client (for testing)
+        if os.getenv("USE_MOCK_SPEAKER_CLIENT") == "true":
+            try:
+                # Import mock client from tests directory
+                import sys
+                from pathlib import Path
+
+                # Add tests directory to Python path
+                tests_dir = Path(__file__).resolve().parents[5] / "tests"
+                if str(tests_dir) not in sys.path:
+                    sys.path.insert(0, str(tests_dir))
+
+                from mocks.mock_speaker_client import MockSpeakerRecognitionClient
+
+                self._mock_client = MockSpeakerRecognitionClient()
+                self.enabled = True
+                self.service_url = "mock://speaker-service"
+                logger.info("🎤 Using MOCK speaker recognition client for tests")
+                return
+            except ImportError as e:
+                logger.error(f"Failed to import mock speaker client: {e}")
+                # Fall through to normal initialization
+
         # Load speaker recognition config from config.yml
         registry = get_models_registry()
         if not registry or not registry.speaker_recognition:
@@ -88,6 +111,12 @@ async def diarize_identify_match(
         Returns:
             Dictionary containing segments with matched text and speaker identification
         """
+        # Use mock client if configured
+        if hasattr(self, '_mock_client'):
+            return await self._mock_client.diarize_identify_match(
+                conversation_id, backend_token, transcript_data, user_id
+            )
+
         if not self.enabled:
             logger.info(f"🎤 Speaker recognition disabled, returning empty result")
             return {"segments": []}
diff --git a/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py b/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py
index 406389a7..28581d09 100644
--- a/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py
+++ b/backends/advanced/src/advanced_omi_backend/utils/audio_chunk_utils.py
@@ -587,20 +587,63 @@ async def reconstruct_audio_segment(
             channels=channels,
         )
 
-    # Decode and concatenate chunks
-    pcm_data = await concatenate_chunks_to_pcm(chunks)
+    # Decode each chunk and clip to exact time boundaries for precise segment extraction
+    pcm_buffer = bytearray()
+    bytes_per_second = sample_rate * channels * 2  # 16-bit = 2 bytes per sample
 
-    # Build WAV file for this segment
+    for chunk in chunks:
+        # Decode this chunk to PCM
+        pcm_data = await decode_opus_to_pcm(
+            opus_data=chunk.audio_data,
+            sample_rate=chunk.sample_rate,
+            channels=chunk.channels,
+        )
+
+        # Calculate clip boundaries for this chunk
+        clip_start_byte = 0
+        clip_end_byte = len(pcm_data)
+
+        # Trim start if chunk begins before requested start_time
+        if chunk.start_time < start_time:
+            offset_seconds = start_time - chunk.start_time
+            offset_bytes = int(offset_seconds * bytes_per_second)
+            # Align to sample boundary (2 bytes for 16-bit audio)
+            clip_start_byte = (offset_bytes // 2) * 2
+
+        # Trim end if chunk extends past requested end_time
+        if chunk.end_time > end_time:
+            # Calculate duration from chunk start to requested end
+            duration_seconds = end_time - chunk.start_time
+            duration_bytes = int(duration_seconds * bytes_per_second)
+            # Align to sample boundary
+            clip_end_byte = (duration_bytes // 2) * 2
+
+        # Append only the clipped portion to buffer
+        if clip_start_byte < clip_end_byte:
+            clipped_pcm = pcm_data[clip_start_byte:clip_end_byte]
+            pcm_buffer.extend(clipped_pcm)
+
+            logger.debug(
+                f"Chunk {chunk.chunk_index}: [{chunk.start_time:.1f}s - {chunk.end_time:.1f}s] "
+                f"→ clipped [{max(chunk.start_time, start_time):.1f}s - {min(chunk.end_time, end_time):.1f}s] "
+                f"({len(clipped_pcm)} bytes)"
+            )
+
+    # Build WAV file from precisely trimmed PCM data
     wav_bytes = await build_wav_from_pcm(
-        pcm_data=pcm_data,
+        pcm_data=bytes(pcm_buffer),
         sample_rate=sample_rate,
         channels=channels,
     )
 
+    actual_duration = len(pcm_buffer) / bytes_per_second
+    expected_duration = end_time - start_time
+
     logger.info(
         f"Reconstructed audio segment for {conversation_id[:8]}...: "
         f"{start_time:.1f}s - {end_time:.1f}s "
-        f"({len(chunks)} chunks, {len(wav_bytes)} bytes)"
+        f"({len(chunks)} chunks, {len(wav_bytes)} bytes WAV, "
+        f"actual duration: {actual_duration:.2f}s, expected: {expected_duration:.2f}s)"
     )
 
     return wav_bytes
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index beaabbef..063d00b7 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -16,6 +16,7 @@
 from advanced_omi_backend.controllers.queue_controller import redis_conn
 from advanced_omi_backend.controllers.session_controller import mark_session_complete
 from advanced_omi_backend.services.plugin_service import get_plugin_router, init_plugin_router
+from datetime import datetime
 
 from advanced_omi_backend.utils.conversation_utils import (
     analyze_speech,
@@ -873,6 +874,21 @@ async def dispatch_conversation_complete_event_job(
         logger.error(f"Conversation {conversation_id} not found")
         return {"success": False, "error": "Conversation not found"}
 
+    # Save end_reason and completed_at to database if not already set
+    # This ensures end_reason is persisted before plugins receive conversation.complete event
+    if end_reason and conversation.end_reason is None:
+        try:
+            conversation.end_reason = Conversation.EndReason(end_reason)
+        except ValueError:
+            logger.warning(f"⚠️ Invalid end_reason '{end_reason}', using UNKNOWN")
+            conversation.end_reason = Conversation.EndReason.UNKNOWN
+
+        if conversation.completed_at is None:
+            conversation.completed_at = datetime.utcnow()
+
+        await conversation.save()
+        logger.info(f"💾 Saved end_reason={conversation.end_reason} to conversation {conversation_id[:12]} in event dispatch job")
+
     # Get user email for event data
     from advanced_omi_backend.models.user import User
     user = await User.get(user_id)
diff --git a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
index fe130c28..338bdf4b 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
@@ -207,18 +207,11 @@ async def recognise_speakers_job(
     actual_transcript_text = transcript_text or transcript_version.transcript or ""
     actual_words = words if words else []
 
-    # If words not provided, extract from segments (single source of truth)
-    if not actual_words and transcript_version.segments:
-        actual_words = []
-        for seg in transcript_version.segments:
-            for word in seg.words:
-                actual_words.append({
-                    "word": word.word,
-                    "start": word.start,
-                    "end": word.end,
-                    "confidence": word.confidence
-                })
-        logger.info(f"🔤 Extracted {len(actual_words)} words from {len(transcript_version.segments)} segments")
+    # If words not provided, read from transcript version metadata
+    # (Transcription job stores words in metadata since segments are created by speaker service)
+    if not actual_words and transcript_version.metadata:
+        actual_words = transcript_version.metadata.get("words", [])
+        logger.info(f"🔤 Loaded {len(actual_words)} words from transcript version metadata")
 
     if not actual_transcript_text:
         logger.warning(f"🎤 No transcript text found in version {version_id}")
diff --git a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
index 27eb3814..3d5aef5f 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
@@ -357,71 +357,22 @@ async def transcribe_full_audio_job(
     # Calculate processing time (transcription only)
     processing_time = time.time() - start_time
 
-    # Convert segments to SpeakerSegment objects
+    # Transcription only provides text + words with timestamps
+    # Speaker service will create segments via diarization
     speaker_segments = []
-
-    if segments:
-        # Use provided segments
-        for seg in segments:
-            # Use identified_as if available (from speaker recognition), otherwise use speaker label
-            speaker_id = seg.get("identified_as") or seg.get("speaker", "Unknown")
-            # Convert speaker ID to string if it's an integer (some providers return int speaker IDs)
-            speaker_name = f"Speaker {speaker_id}" if isinstance(speaker_id, int) else speaker_id
-
-            speaker_segments.append(
-                Conversation.SpeakerSegment(
-                    start=seg.get("start", 0),
-                    end=seg.get("end", 0),
-                    text=seg.get("text", ""),
-                    speaker=speaker_name,
-                    confidence=seg.get("confidence"),
-                )
-            )
-    elif transcript_text:
-        # Fallback: If no segments but we have text, create a single segment from the full transcript
-        # This handles providers that don't support segmentation
-        # Calculate duration from words if available, otherwise estimate from audio
-        start_time_seg = 0.0
-        end_time_seg = 0.0
-
-        if words:
-            # Use word timestamps if available
-            start_times = [w.get("start", 0) for w in words if "start" in w]
-            end_times = [w.get("end", 0) for w in words if "end" in w]
-            if start_times:
-                start_time_seg = min(start_times)
-            if end_times:
-                end_time_seg = max(end_times)
-        else:
-            # Estimate duration: assume ~150 words per minute, or use audio file duration
-            # For now, use a default duration if we can't calculate it
-            end_time_seg = len(transcript_text.split()) * 0.4  # Rough estimate: 0.4s per word
-
-        speaker_segments.append(
-            Conversation.SpeakerSegment(
-                start=start_time_seg,
-                end=end_time_seg if end_time_seg > start_time_seg else start_time_seg + 1.0,
-                text=transcript_text,
-                speaker="Unknown",
-                confidence=None,
-            )
-        )
-        logger.info(
-            f"📊 Created single segment from transcript text (no segments returned by provider)"
-        )
-
-    logger.info(f"📊 Created {len(speaker_segments)} speaker segments")
+    logger.info(f"📊 Transcription complete: {len(words)} words (segments will be created by speaker service)")
 
     # Add new transcript version
     provider_normalized = provider_name.lower() if provider_name else "unknown"
 
-    # Prepare metadata (transcription only - speaker recognition will add its own metadata)
+    # Prepare metadata (transcription only - speaker service will add segments and metadata)
+    # Store words in metadata so speaker job can access them
     metadata = {
         "trigger": trigger,
         "audio_file_size": len(wav_data),
-        "segment_count": len(segments),
         "word_count": len(words),
-        "speaker_recognition": {"enabled": False, "reason": "handled_by_separate_job"},
+        "segments_created_by": "speaker_service",  # Speaker service creates segments via diarization
+        "words": words,  # Store word-level timing data for speaker job
     }
 
     conversation.add_transcript_version(
diff --git a/backends/advanced/webui/src/pages/Conversations.tsx b/backends/advanced/webui/src/pages/Conversations.tsx
index 9eb27f94..4f3e1b2e 100644
--- a/backends/advanced/webui/src/pages/Conversations.tsx
+++ b/backends/advanced/webui/src/pages/Conversations.tsx
@@ -63,7 +63,6 @@ export default function Conversations() {
   const [playingSegment, setPlayingSegment] = useState<string | null>(null) // Format: "audioUuid-segmentIndex"
   const [audioCurrentTime, setAudioCurrentTime] = useState<{ [conversationId: string]: number }>({})
   const audioRefs = useRef<{ [key: string]: HTMLAudioElement }>({})
-  const segmentTimerRef = useRef<number | null>(null)
 
   // Reprocessing state
   const [openDropdown, setOpenDropdown] = useState<string | null>(null)
@@ -434,49 +433,41 @@ export default function Conversations() {
 
   const handleSegmentPlayPause = (conversationId: string, segmentIndex: number, segment: any) => {
     const segmentId = `${conversationId}-${segmentIndex}`;
-    const audioKey = conversationId; // Use conversation ID as cache key
 
     // If this segment is already playing, pause it
     if (playingSegment === segmentId) {
-      const audio = audioRefs.current[audioKey];
+      const audio = audioRefs.current[segmentId];
       if (audio) {
         audio.pause();
       }
-      if (segmentTimerRef.current) {
-        window.clearTimeout(segmentTimerRef.current);
-        segmentTimerRef.current = null;
-      }
       setPlayingSegment(null);
       return;
     }
 
     // Stop any currently playing segment
     if (playingSegment) {
-      // Stop all audio elements
-      Object.values(audioRefs.current).forEach(audio => {
-        audio.pause();
-      });
-      if (segmentTimerRef.current) {
-        window.clearTimeout(segmentTimerRef.current);
-        segmentTimerRef.current = null;
+      const currentAudio = audioRefs.current[playingSegment];
+      if (currentAudio) {
+        currentAudio.pause();
       }
     }
 
-    // Get or create audio element for this conversation
-    let audio = audioRefs.current[audioKey];
+    // Get or create audio element for this specific segment
+    let audio = audioRefs.current[segmentId];
 
-    // Check if we need to create a new audio element (none exists or previous had error)
+    // Create new audio element with segment-specific URL
     if (!audio || audio.error) {
       const token = localStorage.getItem(getStorageKey('token')) || '';
-      const audioUrl = `${BACKEND_URL}/api/audio/get_audio/${conversationId}?token=${token}`;
-      console.log('Creating audio element with URL:', audioUrl);
-      console.log('Token present:', !!token, 'Token length:', token.length);
+      // Use chunks endpoint with time range for instant loading (only fetches needed chunks)
+      const audioUrl = `${BACKEND_URL}/api/audio/chunks/${conversationId}?start_time=${segment.start}&end_time=${segment.end}&token=${token}`;
+      console.log('Creating segment audio element with URL:', audioUrl);
+      console.log('Segment range:', segment.start, 'to', segment.end, '(duration:', segment.end - segment.start, 'seconds)');
       audio = new Audio(audioUrl);
-      audioRefs.current[audioKey] = audio;
+      audioRefs.current[segmentId] = audio;
 
       // Add error listener for debugging
       audio.addEventListener('error', () => {
-        console.error('Audio element error:', audio.error?.code, audio.error?.message);
+        console.error('Audio segment error:', audio.error?.code, audio.error?.message);
         console.error('Audio src:', audio.src);
       });
 
@@ -486,19 +477,10 @@ export default function Conversations() {
       });
     }
 
-    // Set the start time and play
+    // Play the segment (no need to seek since audio is already trimmed to exact range)
     console.log('Playing segment:', segment.start, 'to', segment.end);
-    audio.currentTime = segment.start;
     audio.play().then(() => {
       setPlayingSegment(segmentId);
-
-      // Set a timer to stop at the segment end time
-      const duration = (segment.end - segment.start) * 1000; // Convert to milliseconds
-      segmentTimerRef.current = window.setTimeout(() => {
-        audio.pause();
-        setPlayingSegment(null);
-        segmentTimerRef.current = null;
-      }, duration);
     }).catch(err => {
       console.error('Error playing audio segment:', err);
       setPlayingSegment(null);
@@ -508,13 +490,10 @@ export default function Conversations() {
   // Cleanup audio on unmount
   useEffect(() => {
     return () => {
-      // Stop all audio and clear timers
+      // Stop all audio elements
       Object.values(audioRefs.current).forEach(audio => {
         audio.pause();
       });
-      if (segmentTimerRef.current) {
-        window.clearTimeout(segmentTimerRef.current);
-      }
     };
   }, [])
 
diff --git a/extras/speaker-recognition/docker-compose-test.yml b/extras/speaker-recognition/docker-compose-test.yml
index 1687dd41..5c11573d 100644
--- a/extras/speaker-recognition/docker-compose-test.yml
+++ b/extras/speaker-recognition/docker-compose-test.yml
@@ -8,8 +8,8 @@ services:
         PYTORCH_CUDA_VERSION: ${COMPUTE_MODE:-cpu}
     image: speaker-recognition:test
     ports:
-      # Map host test port (default 8086) to container port 8085
-      - "${SPEAKER_SERVICE_TEST_PORT:-8086}:8085"
+      # Map host test port (default 8086) to container port 8086
+      - "${SPEAKER_SERVICE_TEST_PORT:-8086}:8086"
     volumes:
       # Mount source code for development (live reload)
       - ./src:/app/src
@@ -26,12 +26,12 @@ services:
       - HF_TOKEN=${HF_TOKEN}
       - SIMILARITY_THRESHOLD=${SIMILARITY_THRESHOLD:-0.15}
       - SPEAKER_SERVICE_HOST=0.0.0.0
-      - SPEAKER_SERVICE_PORT=8085
+      - SPEAKER_SERVICE_PORT=8086
       - DEEPGRAM_API_KEY=${DEEPGRAM_API_KEY}
       - CORS_ORIGINS=http://localhost:3001,http://localhost:8001,https://localhost:3001,https://localhost:8001
     restart: unless-stopped
     healthcheck:
-      test: ["CMD", "curl", "-f", "http://localhost:8085/health"]
+      test: ["CMD", "curl", "-f", "http://localhost:8086/health"]
       interval: 30s
       timeout: 10s
       retries: 3
diff --git a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
index e6c02e95..9e5e48cf 100644
--- a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
+++ b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
@@ -321,10 +321,14 @@ async def diarize_identify_match(
         transcript = json.loads(transcript_data)
         words = transcript.get("words", [])
     except json.JSONDecodeError as e:
-        raise HTTPException(400, f"Invalid transcript_data JSON: {str(e)}") from e
+        error_msg = f"Invalid transcript_data JSON: {str(e)}"
+        log.error(f"❌ {error_msg}")
+        raise HTTPException(400, error_msg) from e
 
     if not words:
-        raise HTTPException(400, "No words found in transcript_data")
+        error_msg = f"No words found in transcript_data (transcript keys: {list(transcript.keys())}, words type: {type(words)})"
+        log.error(f"❌ {error_msg}")
+        raise HTTPException(400, error_msg)
 
     # Get settings for chunking configuration
     from simple_speaker_recognition.api.service import auth as settings
diff --git a/tests/integration/websocket_transcription_e2e_test.robot b/tests/integration/websocket_transcription_e2e_test.robot
index 7b29a06d..3429b52f 100644
--- a/tests/integration/websocket_transcription_e2e_test.robot
+++ b/tests/integration/websocket_transcription_e2e_test.robot
@@ -80,7 +80,7 @@ Speech Detection Receives Transcription From Stream
 
     # Stream audio and close
     ${stream_id}=    Open Audio Stream    device_name=${device_name}
-    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200    realtime_pacing=True
     Close Audio Stream    ${stream_id}
 
     # Wait for speech detection job to complete
@@ -120,7 +120,7 @@ Conversation Created With Valid Transcript
 
     # Stream audio (enough to trigger speech detection)
     ${stream_id}=    Open Audio Stream    device_name=${device_name}
-    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200
+    Send Audio Chunks To Stream    ${stream_id}    ${TEST_AUDIO_FILE}    num_chunks=200    realtime_pacing=True
     Close Audio Stream    ${stream_id}
 
     # DIAGNOSTIC: Verify speech detection job completes before checking for conversation
diff --git a/tests/mocks/__init__.py b/tests/mocks/__init__.py
new file mode 100644
index 00000000..472a0895
--- /dev/null
+++ b/tests/mocks/__init__.py
@@ -0,0 +1 @@
+"""Mock implementations for testing."""
diff --git a/tests/mocks/mock_speaker_client.py b/tests/mocks/mock_speaker_client.py
new file mode 100644
index 00000000..e53a556e
--- /dev/null
+++ b/tests/mocks/mock_speaker_client.py
@@ -0,0 +1,160 @@
+"""Mock speaker recognition client for testing without heavy ML dependencies."""
+
+import logging
+from typing import Dict, Optional
+
+logger = logging.getLogger(__name__)
+
+
+class MockSpeakerRecognitionClient:
+    """
+    Mock speaker recognition client that returns pre-computed segments.
+
+    Used in test environments to avoid running resource-intensive speaker
+    recognition service. Segments are based on test_data.py expectations.
+    """
+
+    # Map audio filenames to mock segment data
+    # Segments follow the structure expected by the backend:
+    # {
+    #   "start": float,          # Start time in seconds
+    #   "end": float,            # End time in seconds
+    #   "text": str,             # Transcript text for this segment
+    #   "speaker": int,          # Speaker label (0, 1, 2, etc.)
+    #   "identified_as": str,    # Speaker name or "Unknown"
+    #   "confidence": float      # Optional confidence score
+    # }
+
+    MOCK_SEGMENTS = {
+        "DIY_Experts_Glass_Blowing_16khz_mono_1min.wav": [
+            {
+                "start": 0.0,
+                "end": 10.08,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "The pumpkin that'll last for forever. Finally. Does it count? Today, we're taking a glass blowing class.",
+                "confidence": 0.95
+            },
+            {
+                "start": 10.28,
+                "end": 20.255,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "I'm sweating already. We've worked with a lot of materials before, but we've only scratched the surface",
+                "confidence": 0.93
+            },
+            {
+                "start": 20.455,
+                "end": 21.895,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "when it comes to glass",
+                "confidence": 0.91
+            },
+            {
+                "start": 22.095,
+                "end": 23.615,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "and that's because",
+                "confidence": 0.94
+            },
+            {
+                "start": 23.815,
+                "end": 28.135,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "a little intimidating. We've got about 400 pounds",
+                "confidence": 0.92
+            },
+            {
+                "start": 28.335,
+                "end": 43.08,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "of liquid glass in this furnace right here. Nick's gonna really help us out. Nick, I'm excited and nervous. Me too.",
+                "confidence": 0.96
+            },
+            {
+                "start": 43.28,
+                "end": 44.48,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "So we're gonna",
+                "confidence": 0.90
+            },
+            {
+                "start": 44.68,
+                "end": 46.76,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "make what's called a trumpet",
+                "confidence": 0.95
+            },
+            {
+                "start": 46.96,
+                "end": 50.24,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "flower. We're using gravity as a tool.",
+                "confidence": 0.93
+            }
+        ]
+    }
+
+    def __init__(self):
+        """Initialize mock client."""
+        logger.info("🎤 Mock speaker recognition client initialized")
+
+    async def diarize_identify_match(
+        self,
+        conversation_id: str,
+        backend_token: str,
+        transcript_data: Dict,
+        user_id: Optional[str] = None
+    ) -> Dict:
+        """
+        Return pre-computed mock segments for known test audio files.
+
+        Args:
+            conversation_id: Not used in mock (audio filename derived from transcript)
+            backend_token: Not used in mock
+            transcript_data: Dict with 'text' and 'words' - used to identify audio file
+            user_id: Not used in mock
+
+        Returns:
+            Dictionary with 'segments' array matching speaker service format
+        """
+        logger.info(f"🎤 Mock speaker client processing conversation: {conversation_id[:12]}...")
+
+        # Try to identify which test audio this is from the transcript
+        transcript_text = transcript_data.get("text", "").lower()
+
+        # Match by transcript content
+        if "glass blowing" in transcript_text or "glass" in transcript_text:
+            filename = "DIY_Experts_Glass_Blowing_16khz_mono_1min.wav"
+            if filename in self.MOCK_SEGMENTS:
+                segments = self.MOCK_SEGMENTS[filename]
+                logger.info(f"🎤 Mock returning {len(segments)} segments for DIY Glass Blowing audio")
+                return {"segments": segments}
+
+        # Fallback: Create single generic segment
+        logger.warning(f"🎤 Mock: No pre-computed segments found, creating generic segment")
+
+        # Get duration from words if available
+        words = transcript_data.get("words", [])
+        if words:
+            duration = words[-1].get("end", 60.0)
+        else:
+            duration = 60.0
+
+        return {
+            "segments": [{
+                "start": 0.0,
+                "end": duration,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": transcript_data.get("text", ""),
+                "confidence": 0.85
+            }]
+        }
diff --git a/tests/setup/test_manager_keywords.robot b/tests/setup/test_manager_keywords.robot
index d306fa78..da415783 100644
--- a/tests/setup/test_manager_keywords.robot
+++ b/tests/setup/test_manager_keywords.robot
@@ -82,7 +82,7 @@ Clear Test Databases
 
     # Clear Redis queues and job registries (preserve worker registrations, failed and finished jobs)
     # Delete all rq:* keys except worker registrations (rq:worker:*), failed jobs (rq:failed:*), and finished jobs (rq:finished:*)
-    ${redis_clear_script}=    Set Variable    redis-cli --scan --pattern "rq:*" | grep -Ev "^rq:(worker|failed|finished)" | xargs -r redis-cli DEL; redis-cli --scan --pattern "audio:*" | xargs -r redis-cli DEL; redis-cli --scan --pattern "consumer:*" | xargs -r redis-cli DEL
+    ${redis_clear_script}=    Set Variable    redis-cli --scan --pattern "rq:*" | grep -Ev "^rq:(worker|failed|finished)" | xargs -r redis-cli DEL; redis-cli --scan --pattern "audio:*" | xargs -r redis-cli DEL; redis-cli --scan --pattern "consumer:*" | xargs -r redis-cli DEL; redis-cli --scan --pattern "transcription:*" | xargs -r redis-cli DEL
     Run Process    docker    exec    ${REDIS_CONTAINER}    sh    -c    ${redis_clear_script}    shell=True
     Log To Console    Redis queues and job registries cleared (worker registrations preserved)
 

From ef719b194e98e881fc3a911a8eb3af147dd85a71 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Fri, 23 Jan 2026 05:00:37 +0000
Subject: [PATCH 11/14] Refactor audio chunk retrieval and enhance logging in
 audio processing

- Introduced logging for audio chunk requests to improve traceability.
- Replaced manual audio chunk processing with a dedicated `reconstruct_audio_segment` function for better clarity and efficiency.
- Improved error handling during audio reconstruction to provide more informative responses in case of failures.
- Cleaned up imports and removed redundant code related to audio chunk calculations.
---
 .../routers/modules/audio_routes.py           | 59 +++++--------------
 .../routers/modules/conversation_routes.py    |  9 +--
 2 files changed, 19 insertions(+), 49 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
index a9f09ac2..7cef955a 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/audio_routes.py
@@ -307,6 +307,10 @@ async def get_audio_chunk_range(
         401: If not authenticated
         400: If time range is invalid
     """
+    import logging
+    logger = logging.getLogger(__name__)
+    logger.info(f"🎵 Audio chunk request: conversation={conversation_id[:8]}..., start={start_time:.2f}s, end={end_time:.2f}s")
+
     # Try token param if header auth failed
     if not current_user and token:
         current_user = await get_user_from_token_param(token)
@@ -333,52 +337,17 @@ async def get_audio_chunk_range(
     if conversation.audio_total_duration and end_time > conversation.audio_total_duration:
         end_time = conversation.audio_total_duration
 
-    # Calculate which chunks are needed (each chunk is 10 seconds)
-    CHUNK_DURATION = 10.0
-    start_chunk = int(start_time / CHUNK_DURATION)
-    end_chunk = int(end_time / CHUNK_DURATION)
-    num_chunks = end_chunk - start_chunk + 1
-
-    # Retrieve only needed chunks
-    chunks = await retrieve_audio_chunks(
-        conversation_id=conversation_id,
-        start_index=start_chunk,
-        limit=num_chunks
-    )
-
-    if not chunks:
-        raise HTTPException(
-            status_code=404,
-            detail=f"No audio data in requested range ({start_time}s-{end_time}s)"
-        )
-
-    # Decode chunks and concatenate
-    pcm_buffer = await concatenate_chunks_to_pcm(chunks)
-
-    # Trim to exact time range within the chunks
-    SAMPLE_RATE = 16000
-    SAMPLE_WIDTH = 2  # 16-bit
-    CHANNELS = 1
-    bytes_per_second = SAMPLE_RATE * SAMPLE_WIDTH * CHANNELS
-
-    # Calculate byte offsets within concatenated buffer
-    start_offset_in_chunk = start_time - (start_chunk * CHUNK_DURATION)
-    end_offset_in_chunk = end_time - (end_chunk * CHUNK_DURATION)
+    # Use the dedicated segment reconstruction function
+    from advanced_omi_backend.utils.audio_chunk_utils import reconstruct_audio_segment
 
-    start_byte = int(start_offset_in_chunk * bytes_per_second)
-    # Calculate end byte from the end of buffer
-    bytes_from_end = int((CHUNK_DURATION - end_offset_in_chunk) * bytes_per_second)
-    end_byte = len(pcm_buffer) - bytes_from_end
-
-    # Trim PCM data
-    trimmed_pcm = pcm_buffer[start_byte:end_byte]
-
-    # Build WAV file with trimmed audio
-    wav_data = await build_wav_from_pcm(
-        pcm_data=trimmed_pcm,
-        sample_rate=SAMPLE_RATE,
-        channels=CHANNELS
-    )
+    try:
+        wav_data = await reconstruct_audio_segment(conversation_id, start_time, end_time)
+        logger.info(f"✅ Returning WAV: {len(wav_data)} bytes for range {start_time:.2f}s - {end_time:.2f}s")
+    except ValueError as e:
+        raise HTTPException(status_code=404, detail=str(e))
+    except Exception as e:
+        logger.error(f"Failed to reconstruct audio segment: {e}")
+        raise HTTPException(status_code=500, detail=f"Failed to reconstruct audio: {str(e)}")
 
     return StreamingResponse(
         io.BytesIO(wav_data),
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
index be2b3bc4..997ab344 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
@@ -7,12 +7,13 @@
 import logging
 from typing import Optional
 
-from fastapi import APIRouter, Depends, Query, HTTPException, Response
+from fastapi import APIRouter, Depends, HTTPException, Query, Response
 
 from advanced_omi_backend.auth import current_active_user
-from advanced_omi_backend.controllers import conversation_controller, audio_controller
-from advanced_omi_backend.users import User
+from advanced_omi_backend.controllers import conversation_controller
 from advanced_omi_backend.models.conversation import Conversation
+from advanced_omi_backend.users import User
+from advanced_omi_backend.utils.audio_chunk_utils import reconstruct_audio_segment
 
 logger = logging.getLogger(__name__)
 
@@ -116,6 +117,7 @@ async def get_conversation_waveform(
         - duration_seconds: float - Total audio duration
     """
     from fastapi import HTTPException
+
     from advanced_omi_backend.models.conversation import Conversation
     from advanced_omi_backend.models.waveform import WaveformData
     from advanced_omi_backend.workers.waveform_jobs import generate_waveform_data
@@ -227,7 +229,6 @@ async def get_audio_segment(
     Returns:
         WAV audio bytes (16kHz, mono) for the requested time range
     """
-    from advanced_omi_backend.utils.audio_chunk_utils import reconstruct_audio_segment
 
     # Verify conversation exists and user has access
     conversation = await Conversation.find_one(

From bd1cd84251a84cdc60b3abda9c4281cb2a87eace Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Fri, 23 Jan 2026 05:10:44 +0000
Subject: [PATCH 12/14] Refactor mock speaker recognition client and improve
 testing structure

- Replaced direct import of mock client with a structured import from the new testing module.
- Introduced a dedicated `mock_speaker_client.py` to provide a mock implementation for speaker recognition, facilitating testing without heavy dependencies.
- Added an `__init__.py` file in the testing directory to organize testing utilities and mocks.
---
 .../speaker_recognition_client.py             |  12 +-
 .../advanced_omi_backend/testing/__init__.py  |   1 +
 .../testing/mock_speaker_client.py            | 160 ++++++++++++++++++
 3 files changed, 163 insertions(+), 10 deletions(-)
 create mode 100644 backends/advanced/src/advanced_omi_backend/testing/__init__.py
 create mode 100644 backends/advanced/src/advanced_omi_backend/testing/mock_speaker_client.py

diff --git a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
index d58b2a5d..b290efb1 100644
--- a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
+++ b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
@@ -39,16 +39,8 @@ def __init__(self, service_url: Optional[str] = None):
         # Check if we should use mock client (for testing)
         if os.getenv("USE_MOCK_SPEAKER_CLIENT") == "true":
             try:
-                # Import mock client from tests directory
-                import sys
-                from pathlib import Path
-
-                # Add tests directory to Python path
-                tests_dir = Path(__file__).resolve().parents[5] / "tests"
-                if str(tests_dir) not in sys.path:
-                    sys.path.insert(0, str(tests_dir))
-
-                from mocks.mock_speaker_client import MockSpeakerRecognitionClient
+                # Import mock client from testing module
+                from advanced_omi_backend.testing.mock_speaker_client import MockSpeakerRecognitionClient
 
                 self._mock_client = MockSpeakerRecognitionClient()
                 self.enabled = True
diff --git a/backends/advanced/src/advanced_omi_backend/testing/__init__.py b/backends/advanced/src/advanced_omi_backend/testing/__init__.py
new file mode 100644
index 00000000..8d430cdf
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/testing/__init__.py
@@ -0,0 +1 @@
+"""Testing utilities and mocks for Chronicle backend."""
diff --git a/backends/advanced/src/advanced_omi_backend/testing/mock_speaker_client.py b/backends/advanced/src/advanced_omi_backend/testing/mock_speaker_client.py
new file mode 100644
index 00000000..e53a556e
--- /dev/null
+++ b/backends/advanced/src/advanced_omi_backend/testing/mock_speaker_client.py
@@ -0,0 +1,160 @@
+"""Mock speaker recognition client for testing without heavy ML dependencies."""
+
+import logging
+from typing import Dict, Optional
+
+logger = logging.getLogger(__name__)
+
+
+class MockSpeakerRecognitionClient:
+    """
+    Mock speaker recognition client that returns pre-computed segments.
+
+    Used in test environments to avoid running resource-intensive speaker
+    recognition service. Segments are based on test_data.py expectations.
+    """
+
+    # Map audio filenames to mock segment data
+    # Segments follow the structure expected by the backend:
+    # {
+    #   "start": float,          # Start time in seconds
+    #   "end": float,            # End time in seconds
+    #   "text": str,             # Transcript text for this segment
+    #   "speaker": int,          # Speaker label (0, 1, 2, etc.)
+    #   "identified_as": str,    # Speaker name or "Unknown"
+    #   "confidence": float      # Optional confidence score
+    # }
+
+    MOCK_SEGMENTS = {
+        "DIY_Experts_Glass_Blowing_16khz_mono_1min.wav": [
+            {
+                "start": 0.0,
+                "end": 10.08,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "The pumpkin that'll last for forever. Finally. Does it count? Today, we're taking a glass blowing class.",
+                "confidence": 0.95
+            },
+            {
+                "start": 10.28,
+                "end": 20.255,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "I'm sweating already. We've worked with a lot of materials before, but we've only scratched the surface",
+                "confidence": 0.93
+            },
+            {
+                "start": 20.455,
+                "end": 21.895,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "when it comes to glass",
+                "confidence": 0.91
+            },
+            {
+                "start": 22.095,
+                "end": 23.615,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "and that's because",
+                "confidence": 0.94
+            },
+            {
+                "start": 23.815,
+                "end": 28.135,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "a little intimidating. We've got about 400 pounds",
+                "confidence": 0.92
+            },
+            {
+                "start": 28.335,
+                "end": 43.08,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "of liquid glass in this furnace right here. Nick's gonna really help us out. Nick, I'm excited and nervous. Me too.",
+                "confidence": 0.96
+            },
+            {
+                "start": 43.28,
+                "end": 44.48,
+                "speaker": 1,
+                "identified_as": "Unknown",
+                "text": "So we're gonna",
+                "confidence": 0.90
+            },
+            {
+                "start": 44.68,
+                "end": 46.76,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "make what's called a trumpet",
+                "confidence": 0.95
+            },
+            {
+                "start": 46.96,
+                "end": 50.24,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": "flower. We're using gravity as a tool.",
+                "confidence": 0.93
+            }
+        ]
+    }
+
+    def __init__(self):
+        """Initialize mock client."""
+        logger.info("🎤 Mock speaker recognition client initialized")
+
+    async def diarize_identify_match(
+        self,
+        conversation_id: str,
+        backend_token: str,
+        transcript_data: Dict,
+        user_id: Optional[str] = None
+    ) -> Dict:
+        """
+        Return pre-computed mock segments for known test audio files.
+
+        Args:
+            conversation_id: Not used in mock (audio filename derived from transcript)
+            backend_token: Not used in mock
+            transcript_data: Dict with 'text' and 'words' - used to identify audio file
+            user_id: Not used in mock
+
+        Returns:
+            Dictionary with 'segments' array matching speaker service format
+        """
+        logger.info(f"🎤 Mock speaker client processing conversation: {conversation_id[:12]}...")
+
+        # Try to identify which test audio this is from the transcript
+        transcript_text = transcript_data.get("text", "").lower()
+
+        # Match by transcript content
+        if "glass blowing" in transcript_text or "glass" in transcript_text:
+            filename = "DIY_Experts_Glass_Blowing_16khz_mono_1min.wav"
+            if filename in self.MOCK_SEGMENTS:
+                segments = self.MOCK_SEGMENTS[filename]
+                logger.info(f"🎤 Mock returning {len(segments)} segments for DIY Glass Blowing audio")
+                return {"segments": segments}
+
+        # Fallback: Create single generic segment
+        logger.warning(f"🎤 Mock: No pre-computed segments found, creating generic segment")
+
+        # Get duration from words if available
+        words = transcript_data.get("words", [])
+        if words:
+            duration = words[-1].get("end", 60.0)
+        else:
+            duration = 60.0
+
+        return {
+            "segments": [{
+                "start": 0.0,
+                "end": duration,
+                "speaker": 0,
+                "identified_as": "Unknown",
+                "text": transcript_data.get("text", ""),
+                "confidence": 0.85
+            }]
+        }

From 0dfd90066dd3ec8895b47a853cf46afebe669783 Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Fri, 23 Jan 2026 13:40:16 +0000
Subject: [PATCH 13/14] Enhance conversation model to include word-level
 timestamps and improve transcript handling

- Added a new `words` field to the `Conversation` model for storing word-level timestamps.
- Updated methods to handle word data during transcript version creation, ensuring compatibility with speaker recognition.
- Refactored conversation job processing to utilize the new word structure, improving data integrity and access.
- Enhanced speaker recognition job to read words from the new standardized location, ensuring backward compatibility with legacy data.
---
 .../models/conversation.py                    | 17 ++++-
 .../workers/conversation_jobs.py              | 73 +++++--------------
 .../workers/speaker_jobs.py                   | 43 ++++++++++-
 .../workers/transcription_jobs.py             | 16 +++-
 4 files changed, 84 insertions(+), 65 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/models/conversation.py b/backends/advanced/src/advanced_omi_backend/models/conversation.py
index 28a2f0ec..1ee9a57a 100644
--- a/backends/advanced/src/advanced_omi_backend/models/conversation.py
+++ b/backends/advanced/src/advanced_omi_backend/models/conversation.py
@@ -63,7 +63,14 @@ class TranscriptVersion(BaseModel):
         """Version of a transcript with processing metadata."""
         version_id: str = Field(description="Unique version identifier")
         transcript: Optional[str] = Field(None, description="Full transcript text")
-        segments: List["Conversation.SpeakerSegment"] = Field(default_factory=list, description="Speaker segments")
+        words: List["Conversation.Word"] = Field(
+            default_factory=list,
+            description="Word-level timestamps for entire transcript"
+        )
+        segments: List["Conversation.SpeakerSegment"] = Field(
+            default_factory=list,
+            description="Speaker segments (filled by speaker recognition)"
+        )
         provider: Optional[str] = Field(None, description="Transcription provider used (deepgram, parakeet, etc.)")
         model: Optional[str] = Field(None, description="Model used (e.g., nova-3, parakeet)")
         created_at: datetime = Field(description="When this version was created")
@@ -253,8 +260,9 @@ def add_transcript_version(
         self,
         version_id: str,
         transcript: str,
-        segments: List["Conversation.SpeakerSegment"],
-        provider: str,  # Provider name from config.yml (deepgram, parakeet, etc.)
+        words: Optional[List["Conversation.Word"]] = None,
+        segments: Optional[List["Conversation.SpeakerSegment"]] = None,
+        provider: str = None,  # Provider name from config.yml (deepgram, parakeet, etc.)
         model: Optional[str] = None,
         processing_time_seconds: Optional[float] = None,
         metadata: Optional[Dict[str, Any]] = None,
@@ -264,7 +272,8 @@ def add_transcript_version(
         new_version = Conversation.TranscriptVersion(
             version_id=version_id,
             transcript=transcript,
-            segments=segments,
+            words=words or [],
+            segments=segments or [],
             provider=provider,
             model=model,
             created_at=datetime.now(),
diff --git a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
index 063d00b7..febdfbd8 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/conversation_jobs.py
@@ -588,74 +588,39 @@ async def open_conversation_job(
     # Create transcript version from streaming results
     version_id = f"streaming_{session_id[:12]}"
     transcript_text = final_transcript.get("text", "")
-    segments_data = final_transcript.get("segments", [])
-
-    # If streaming provider didn't provide segments (e.g., Deepgram streaming),
-    # create segments from individual final results with word-level data
-    if not segments_data:
-        logger.info(f"📝 No segments in streaming results, creating from word-level data")
-        results = await aggregator.get_session_results(session_id)
-
-        for result in results:
-            words = result.get("words", [])
-            text = result.get("text", "").strip()
-
-            # Skip empty results or results without timing data
-            # WARNING: We don't support results without word-level timing data.
-            # Ideally should error, but skipping for now to handle edge cases gracefully.
-            if not words or not text:
-                continue
-
-            # Create segment dict from this result chunk
-            # Each "final" result becomes one segment with generic speaker label
-            segment_dict = {
-                "start": words[0]["start"],
-                "end": words[-1]["end"],
-                "text": text,
-                "speaker": "SPEAKER_00",  # Generic label, updated by speaker recognition
-                "confidence": result.get("confidence"),
-                "words": words  # Already in correct format from aggregator
-            }
-            segments_data.append(segment_dict)
-
-        logger.info(f"✅ Created {len(segments_data)} segments from streaming results")
-
-    # Convert segments to SpeakerSegment format with word-level timestamps
-    segments = [
-        Conversation.SpeakerSegment(
-            start=seg.get("start", 0.0),
-            end=seg.get("end", 0.0),
-            text=seg.get("text", ""),
-            speaker=seg.get("speaker", "SPEAKER_00"),
-            confidence=seg.get("confidence"),
-            words=[
-                Conversation.Word(
-                    word=w.get("word", ""),
-                    start=w.get("start", 0.0),
-                    end=w.get("end", 0.0),
-                    confidence=w.get("confidence")
-                )
-                for w in seg.get("words", [])
-            ]
+    words_data = final_transcript.get("words", [])  # All words from aggregator
+
+    # Convert words to Word objects
+    words = [
+        Conversation.Word(
+            word=w.get("word", ""),
+            start=w.get("start", 0.0),
+            end=w.get("end", 0.0),
+            confidence=w.get("confidence")
         )
-        for seg in segments_data
+        for w in words_data
     ]
 
+    # Segments remain EMPTY until speaker recognition service processes them
+    # Per Chronicle architecture: segments ONLY come from speaker service
+    segments = []
+
     # Determine provider from streaming results
     provider = final_transcript.get("provider", "deepgram")
 
-    # Add streaming transcript as the initial version
+    # Add streaming transcript with words at version level
     conversation.add_transcript_version(
         version_id=version_id,
         transcript=transcript_text,
-        segments=segments,
+        words=words,  # Store at version level
+        segments=segments,  # Empty - only speaker service creates segments
         provider=provider,
         model=provider,  # Provider name as model
         processing_time_seconds=None,  # Not applicable for streaming
         metadata={
             "source": "streaming",
             "chunk_count": final_transcript.get("chunk_count", 0),
-            "word_count": len(final_transcript.get("words", []))
+            "word_count": len(words),
         },
         set_as_active=True
     )
@@ -664,7 +629,7 @@ async def open_conversation_job(
     await conversation.save()
     logger.info(
         f"✅ Saved streaming transcript: {len(transcript_text)} chars, "
-        f"{len(segments)} segments, {len(final_transcript.get('words', []))} words "
+        f"{len(segments)} segments (empty until speaker recognition), {len(words)} words "
         f"for conversation {conversation_id[:12]}"
     )
 
diff --git a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
index 338bdf4b..729ba3b3 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
@@ -207,11 +207,36 @@ async def recognise_speakers_job(
     actual_transcript_text = transcript_text or transcript_version.transcript or ""
     actual_words = words if words else []
 
-    # If words not provided, read from transcript version metadata
-    # (Transcription job stores words in metadata since segments are created by speaker service)
-    if not actual_words and transcript_version.metadata:
+    # If words not provided as parameter, read from version.words field (standardized location)
+    if not actual_words and transcript_version.words:
+        # Convert Word objects to dicts for speaker service API
+        actual_words = [
+            {
+                "word": w.word,
+                "start": w.start,
+                "end": w.end,
+                "confidence": w.confidence
+            }
+            for w in transcript_version.words
+        ]
+        logger.info(f"🔤 Loaded {len(actual_words)} words from transcript version.words field")
+    # Backward compatibility: Fall back to metadata if words field is empty (old data)
+    elif not actual_words and transcript_version.metadata.get("words"):
         actual_words = transcript_version.metadata.get("words", [])
-        logger.info(f"🔤 Loaded {len(actual_words)} words from transcript version metadata")
+        logger.info(f"🔤 Loaded {len(actual_words)} words from transcript version metadata (legacy)")
+    # Backward compatibility: Extract from segments if that's all we have (old streaming data)
+    elif not actual_words and transcript_version.segments:
+        for segment in transcript_version.segments:
+            if segment.words:
+                for w in segment.words:
+                    actual_words.append({
+                        "word": w.word,
+                        "start": w.start,
+                        "end": w.end,
+                        "confidence": w.confidence
+                    })
+        if actual_words:
+            logger.info(f"🔤 Extracted {len(actual_words)} words from segments (legacy)")
 
     if not actual_transcript_text:
         logger.warning(f"🎤 No transcript text found in version {version_id}")
@@ -223,6 +248,16 @@ async def recognise_speakers_job(
             "processing_time_seconds": 0
         }
 
+    if not actual_words:
+        logger.warning(f"🎤 No words found in version {version_id}")
+        return {
+            "success": False,
+            "conversation_id": conversation_id,
+            "version_id": version_id,
+            "error": "No word-level timing data available",
+            "processing_time_seconds": 0
+        }
+
     transcript_data = {
         "text": actual_transcript_text,
         "words": actual_words
diff --git a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
index 3d5aef5f..a3676383 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/transcription_jobs.py
@@ -365,20 +365,30 @@ async def transcribe_full_audio_job(
     # Add new transcript version
     provider_normalized = provider_name.lower() if provider_name else "unknown"
 
+    # Convert words to Word objects
+    word_objects = [
+        Conversation.Word(
+            word=w.get("word", ""),
+            start=w.get("start", 0.0),
+            end=w.get("end", 0.0),
+            confidence=w.get("confidence")
+        )
+        for w in words
+    ]
+
     # Prepare metadata (transcription only - speaker service will add segments and metadata)
-    # Store words in metadata so speaker job can access them
     metadata = {
         "trigger": trigger,
         "audio_file_size": len(wav_data),
         "word_count": len(words),
         "segments_created_by": "speaker_service",  # Speaker service creates segments via diarization
-        "words": words,  # Store word-level timing data for speaker job
     }
 
     conversation.add_transcript_version(
         version_id=version_id,
         transcript=transcript_text,
-        segments=speaker_segments,
+        words=word_objects,  # Store at version level (not in metadata!)
+        segments=speaker_segments,  # Empty - will be filled by speaker recognition
         provider=provider_normalized,  # Now just a string, no enum constructor needed
         model=provider.name,
         processing_time_seconds=processing_time,

From 7df727f81e24dff1406806158811dae7424bed7d Mon Sep 17 00:00:00 2001
From: Ankush Malaker <43288948+AnkushMalaker@users.noreply.github.com>
Date: Fri, 23 Jan 2026 16:21:20 +0000
Subject: [PATCH 14/14] Implement speaker reprocessing feature and enhance
 timeout calculation

- Added a new endpoint to reprocess speaker identification for existing transcripts, creating a new version with re-identified speakers.
- Introduced a method to calculate proportional timeouts based on audio duration, improving handling of varying audio lengths.
- Updated the speaker recognition client to utilize calculated timeouts during service calls, enhancing responsiveness.
- Refactored conversation and memory controllers to support the new speaker reprocessing functionality, ensuring user access control and job chaining for memory updates.
- Removed unfiltered memory retrieval endpoint to streamline memory management and focus on user-specific data access.
---
 .../controllers/conversation_controller.py    | 166 ++++++++++++++++++
 .../controllers/memory_controller.py          |  27 ---
 .../routers/modules/conversation_routes.py    |  26 +++
 .../routers/modules/memory_routes.py          |  10 --
 .../speaker_recognition_client.py             |  62 ++++++-
 .../workers/speaker_jobs.py                   |  76 ++++++--
 .../webui/src/pages/Conversations.tsx         |  51 ++++++
 .../advanced/webui/src/pages/Memories.tsx     |  24 +--
 backends/advanced/webui/src/services/api.ts   |  10 +-
 extras/speaker-recognition/.env.template      |  16 ++
 extras/speaker-recognition/init.py            |  13 +-
 .../api/routers/identification.py             |  84 +++++++--
 12 files changed, 479 insertions(+), 86 deletions(-)

diff --git a/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
index f8afaf9d..e6aac85a 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/conversation_controller.py
@@ -561,6 +561,172 @@ async def reprocess_memory(conversation_id: str, transcript_version_id: str, use
         return JSONResponse(status_code=500, content={"error": "Error starting memory reprocessing"})
 
 
+async def reprocess_speakers(
+    conversation_id: str,
+    transcript_version_id: str,
+    user: User
+):
+    """
+    Reprocess speaker identification for a specific transcript version.
+    Users can only reprocess their own conversations.
+
+    Creates NEW transcript version with same text/words but re-identified speakers.
+    Automatically chains memory reprocessing since speaker attribution affects meaning.
+    """
+    try:
+        # 1. Find conversation and validate ownership
+        conversation_model = await Conversation.find_one(
+            Conversation.conversation_id == conversation_id
+        )
+        if not conversation_model:
+            return JSONResponse(
+                status_code=404,
+                content={"error": "Conversation not found"}
+            )
+
+        # Check ownership for non-admin users
+        if not user.is_superuser and conversation_model.user_id != str(user.user_id):
+            return JSONResponse(
+                status_code=403,
+                content={"error": "Access forbidden. You can only reprocess your own conversations."}
+            )
+
+        # 2. Resolve source transcript version ID (handle "active" special case)
+        source_version_id = transcript_version_id
+        if source_version_id == "active":
+            active_version_id = conversation_model.active_transcript_version
+            if not active_version_id:
+                return JSONResponse(
+                    status_code=404,
+                    content={"error": "No active transcript version found"}
+                )
+            source_version_id = active_version_id
+
+        # 3. Find and validate the source transcript version
+        source_version = None
+        for version in conversation_model.transcript_versions:
+            if version.version_id == source_version_id:
+                source_version = version
+                break
+
+        if not source_version:
+            return JSONResponse(
+                status_code=404,
+                content={"error": f"Transcript version '{source_version_id}' not found"}
+            )
+
+        # 4. Validate transcript has content and words
+        if not source_version.transcript:
+            return JSONResponse(
+                status_code=400,
+                content={"error": "Cannot re-diarize empty transcript. Transcript version has no text."}
+            )
+
+        if not source_version.words:
+            return JSONResponse(
+                status_code=400,
+                content={"error": "Cannot re-diarize transcript without word timings. Words are required for diarization."}
+            )
+
+        # 5. Check if speaker recognition is enabled
+        speaker_config = get_service_config('speaker_recognition')
+        if not speaker_config.get('enabled', True):
+            return JSONResponse(
+                status_code=400,
+                content={
+                    "error": "Speaker recognition is disabled",
+                    "details": "Enable speaker service in config to use this feature"
+                }
+            )
+
+        # 6. Create NEW transcript version (copy text/words, empty segments)
+        new_version_id = str(uuid.uuid4())
+
+        # Add new version with copied text/words but empty segments
+        # Speaker job will populate segments with re-identified speakers
+        conversation_model.add_transcript_version(
+            version_id=new_version_id,
+            transcript=source_version.transcript,  # COPY transcript text
+            words=source_version.words,  # COPY word timings
+            segments=[],  # Empty - will be populated by speaker job
+            provider=source_version.provider,
+            model=source_version.model,
+            processing_time_seconds=None,  # Will be updated by job
+            metadata={
+                "reprocessing_type": "speaker_diarization",
+                "source_version_id": source_version_id,
+                "trigger": "manual_reprocess"
+            },
+            set_as_active=True  # Set new version as active
+        )
+
+        # Save conversation with new version
+        await conversation_model.save()
+
+        logger.info(
+            f"Created new transcript version {new_version_id} from source {source_version_id} "
+            f"for conversation {conversation_id}"
+        )
+
+        # 7. Enqueue speaker recognition job with NEW version_id
+        speaker_job = transcription_queue.enqueue(
+            recognise_speakers_job,
+            conversation_id,
+            new_version_id,  # NEW version (not source)
+            job_timeout=1200,  # 20 minutes
+            result_ttl=JOB_RESULT_TTL,
+            job_id=f"reprocess_speaker_{conversation_id[:12]}",
+            description=f"Re-diarize speakers for {conversation_id[:8]}",
+            meta={
+                'conversation_id': conversation_id,
+                'version_id': new_version_id,
+                'source_version_id': source_version_id,
+                'trigger': 'reprocess'
+            }
+        )
+
+        logger.info(
+            f"Enqueued speaker reprocessing job {speaker_job.id} "
+            f"for new version {new_version_id}"
+        )
+
+        # 8. Chain memory reprocessing (speaker changes affect memory context)
+        memory_job = memory_queue.enqueue(
+            process_memory_job,
+            conversation_id,
+            depends_on=speaker_job,
+            job_timeout=1800,  # 30 minutes
+            result_ttl=JOB_RESULT_TTL,
+            job_id=f"memory_{conversation_id[:12]}",
+            description=f"Extract memories for {conversation_id[:8]}",
+            meta={
+                'conversation_id': conversation_id,
+                'trigger': 'reprocess_after_speaker'
+            }
+        )
+
+        logger.info(
+            f"Chained memory reprocessing job {memory_job.id} "
+            f"after speaker job {speaker_job.id}"
+        )
+
+        # 9. Return job information
+        return JSONResponse(content={
+            "message": "Speaker reprocessing started",
+            "job_id": speaker_job.id,
+            "version_id": new_version_id,  # NEW version ID
+            "source_version_id": source_version_id,  # Original version used as source
+            "status": "queued"
+        })
+
+    except Exception as e:
+        logger.error(f"Error starting speaker reprocessing: {e}")
+        return JSONResponse(
+            status_code=500,
+            content={"error": "Error starting speaker reprocessing"}
+        )
+
+
 async def activate_transcript_version(conversation_id: str, version_id: str, user: User):
     """Activate a specific transcript version. Users can only modify their own conversations."""
     try:
diff --git a/backends/advanced/src/advanced_omi_backend/controllers/memory_controller.py b/backends/advanced/src/advanced_omi_backend/controllers/memory_controller.py
index f52167de..5abf4b36 100644
--- a/backends/advanced/src/advanced_omi_backend/controllers/memory_controller.py
+++ b/backends/advanced/src/advanced_omi_backend/controllers/memory_controller.py
@@ -139,33 +139,6 @@ async def delete_memory(memory_id: str, user: User):
         )
 
 
-async def get_memories_unfiltered(user: User, limit: int, user_id: Optional[str] = None):
-    """Get all memories including fallback transcript memories (for debugging). Users see only their own memories, admins can see all or filter by user."""
-    try:
-        memory_service = get_memory_service()
-
-        # Determine which user's memories to fetch
-        target_user_id = user.user_id
-        if user.is_superuser and user_id:
-            target_user_id = user_id
-
-        # Execute memory retrieval directly (now async)
-        memories = await memory_service.get_all_memories_unfiltered(target_user_id, limit)
-
-        return {
-            "memories": memories,
-            "count": len(memories),
-            "user_id": target_user_id,
-            "includes_fallback": True,
-        }
-
-    except Exception as e:
-        audio_logger.error(f"Error fetching unfiltered memories: {e}", exc_info=True)
-        return JSONResponse(
-            status_code=500, content={"message": f"Error fetching unfiltered memories: {str(e)}"}
-        )
-
-
 async def add_memory(content: str, user: User, source_id: Optional[str] = None):
     """Add a memory directly from content text. Extracts structured memories from the provided content."""
     try:
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
index 997ab344..25f494ce 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/conversation_routes.py
@@ -66,6 +66,32 @@ async def reprocess_memory(
     return await conversation_controller.reprocess_memory(conversation_id, transcript_version_id, current_user)
 
 
+@router.post("/{conversation_id}/reprocess-speakers")
+async def reprocess_speakers(
+    conversation_id: str,
+    current_user: User = Depends(current_active_user),
+    transcript_version_id: str = Query(default="active")
+):
+    """
+    Re-run speaker identification/diarization on existing transcript.
+
+    Creates a NEW transcript version with same text/words but re-identified speakers.
+    Automatically chains memory reprocessing since speaker changes affect memory context.
+
+    Args:
+        conversation_id: Conversation to reprocess
+        transcript_version_id: Which transcript version to use as source (default: "active")
+
+    Returns:
+        Job status with job_id and new version_id
+    """
+    return await conversation_controller.reprocess_speakers(
+        conversation_id,
+        transcript_version_id,
+        current_user
+    )
+
+
 @router.post("/{conversation_id}/activate-transcript/{version_id}")
 async def activate_transcript_version(
     conversation_id: str,
diff --git a/backends/advanced/src/advanced_omi_backend/routers/modules/memory_routes.py b/backends/advanced/src/advanced_omi_backend/routers/modules/memory_routes.py
index d0be9528..185f55ec 100644
--- a/backends/advanced/src/advanced_omi_backend/routers/modules/memory_routes.py
+++ b/backends/advanced/src/advanced_omi_backend/routers/modules/memory_routes.py
@@ -72,16 +72,6 @@ async def delete_memory(memory_id: str, current_user: User = Depends(current_act
     return await memory_controller.delete_memory(memory_id, current_user)
 
 
-@router.get("/unfiltered")
-async def get_memories_unfiltered(
-    current_user: User = Depends(current_active_user),
-    limit: int = Query(default=50, ge=1, le=1000),
-    user_id: Optional[str] = Query(default=None, description="User ID filter (admin only)"),
-):
-    """Get all memories including fallback transcript memories (for debugging). Users see only their own memories, admins can see all or filter by user."""
-    return await memory_controller.get_memories_unfiltered(current_user, limit, user_id)
-
-
 @router.get("/admin")
 async def get_all_memories_admin(current_user: User = Depends(current_superuser), limit: int = 200):
     """Get all memories across all users for admin review. Admin only."""
diff --git a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
index b290efb1..772ae33c 100644
--- a/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
+++ b/backends/advanced/src/advanced_omi_backend/speaker_recognition_client.py
@@ -81,6 +81,35 @@ def __init__(self, service_url: Optional[str] = None):
         else:
             logger.info("Speaker recognition client disabled (no service URL configured)")
 
+    def calculate_timeout(self, audio_duration: Optional[float]) -> float:
+        """
+        Calculate proportional timeout based on audio duration.
+
+        Uses the formula: timeout = min(MAX_TIMEOUT, audio_duration * MULTIPLIER + BASE_TIMEOUT)
+
+        Args:
+            audio_duration: Duration of audio in seconds
+
+        Returns:
+            Calculated timeout in seconds
+        """
+        BASE_TIMEOUT = 30.0  # Minimum timeout for short files
+        TIMEOUT_MULTIPLIER = 8.0  # Processing speed ratio (e.g., 1 min audio = 8 min timeout)
+        MAX_TIMEOUT = 600.0  # 10 minute cap for very long files
+
+        if audio_duration is None or audio_duration <= 0:
+            logger.warning("Audio duration unknown or invalid, using base timeout")
+            return BASE_TIMEOUT
+
+        calculated_timeout = audio_duration * TIMEOUT_MULTIPLIER + BASE_TIMEOUT
+        timeout = min(MAX_TIMEOUT, calculated_timeout)
+
+        logger.info(
+            f"🕐 Calculated timeout: audio_duration={audio_duration:.1f}s → "
+            f"timeout={timeout:.1f}s (base={BASE_TIMEOUT}, multiplier={TIMEOUT_MULTIPLIER}, max={MAX_TIMEOUT})"
+        )
+        return timeout
+
     async def diarize_identify_match(
         self,
         conversation_id: str,
@@ -113,6 +142,14 @@ async def diarize_identify_match(
             logger.info(f"🎤 Speaker recognition disabled, returning empty result")
             return {"segments": []}
 
+        # Fetch conversation to get audio duration for timeout calculation
+        from advanced_omi_backend.models.conversation import Conversation
+        conversation = await Conversation.find_one(Conversation.conversation_id == conversation_id)
+        audio_duration = conversation.audio_total_duration if conversation else None
+
+        # Calculate proportional timeout based on audio duration
+        timeout = self.calculate_timeout(audio_duration)
+
         try:
             logger.info(f"🎤 Calling speaker service with conversation_id: {conversation_id[:12]}...")
 
@@ -172,7 +209,7 @@ async def diarize_identify_match(
                 async with session.post(
                     request_url,
                     data=form_data,
-                    timeout=aiohttp.ClientTimeout(total=120),
+                    timeout=aiohttp.ClientTimeout(total=timeout),
                 ) as response:
                     logger.info(f"🎤 Speaker service response status: {response.status}")
 
@@ -231,6 +268,11 @@ async def diarize_and_identify(
                 f"({len(audio_data) / 1024 / 1024:.2f} MB)"
             )
 
+            # Estimate audio duration from data size (assuming 16kHz, 16-bit PCM)
+            # WAV header is typically 44 bytes
+            estimated_duration = (len(audio_data) - 44) / 32000  # 16000 Hz * 2 bytes per sample
+            timeout = self.calculate_timeout(estimated_duration)
+
             # Call the speaker recognition service
             async with aiohttp.ClientSession() as session:
                 # Prepare the audio data for upload (no disk I/O!)
@@ -277,7 +319,7 @@ async def diarize_and_identify(
                 async with session.post(
                     endpoint_url,
                     data=form_data,
-                    timeout=aiohttp.ClientTimeout(total=120),
+                    timeout=aiohttp.ClientTimeout(total=timeout),
                 ) as response:
                     logger.info(f"🎤 [DIARIZE] Response status: {response.status}")
 
@@ -346,6 +388,20 @@ async def identify_speakers(self, audio_path: str, segments: List[Dict]) -> Dict
 
             logger.info(f"Identifying {len(unique_speakers)} speakers in {audio_path}")
 
+            # Get audio duration for timeout calculation
+            import wave
+            try:
+                with wave.open(audio_path, "rb") as wav_file:
+                    frame_count = wav_file.getnframes()
+                    sample_rate = wav_file.getframerate()
+                    audio_duration = frame_count / sample_rate if sample_rate > 0 else None
+            except Exception as e:
+                logger.warning(f"Failed to get audio duration from {audio_path}: {e}")
+                audio_duration = None
+
+            # Calculate proportional timeout based on audio duration
+            timeout = self.calculate_timeout(audio_duration)
+
             # Call the speaker recognition service
             async with aiohttp.ClientSession() as session:
                 # Prepare the audio file for upload
@@ -374,7 +430,7 @@ async def identify_speakers(self, audio_path: str, segments: List[Dict]) -> Dict
                     async with session.post(
                         f"{self.service_url}/diarize-and-identify",
                         data=form_data,
-                        timeout=aiohttp.ClientTimeout(total=120),
+                        timeout=aiohttp.ClientTimeout(total=timeout),
                     ) as response:
                         if response.status != 200:
                             logger.warning(
diff --git a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
index 729ba3b3..d9adbada 100644
--- a/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
+++ b/backends/advanced/src/advanced_omi_backend/workers/speaker_jobs.py
@@ -315,33 +315,61 @@ async def recognise_speakers_job(
             error_message = speaker_result.get("message", "Unknown error")
             logger.error(f"🎤 Speaker recognition service error: {error_type} - {error_message}")
 
-            # For connection failures, skip speaker recognition but allow downstream jobs to proceed
-            # Speaker recognition is optional - memory extraction and other jobs should still run
+            # Connection/timeout errors → skip gracefully (existing behavior)
             if error_type in ("connection_failed", "timeout", "client_error"):
                 logger.warning(
                     f"⚠️ Speaker service unavailable ({error_type}), skipping speaker recognition. "
                     f"Downstream jobs (memory, title/summary, events) will proceed normally."
                 )
                 return {
-                    "success": True,
+                    "success": True,  # Allow pipeline to continue
                     "conversation_id": conversation_id,
                     "version_id": version_id,
                     "speaker_recognition_enabled": True,
                     "speaker_service_unavailable": True,
                     "identified_speakers": [],
                     "skip_reason": f"Speaker service unavailable: {error_type}",
+                    "error_type": error_type,
                     "processing_time_seconds": time.time() - start_time
                 }
 
-            # For other errors (e.g., processing errors), return error dict without failing
-            return {
-                "success": False,
-                "conversation_id": conversation_id,
-                "version_id": version_id,
-                "error": f"Speaker recognition failed: {error_type}",
-                "error_details": error_message,
-                "processing_time_seconds": time.time() - start_time
-            }
+            # Validation errors → fail job, don't retry
+            elif error_type == "validation_error":
+                logger.error(f"❌ Speaker service validation error: {error_message}")
+                return {
+                    "success": False,
+                    "conversation_id": conversation_id,
+                    "version_id": version_id,
+                    "error": f"Validation error: {error_message}",
+                    "error_type": error_type,
+                    "retryable": False,  # Don't retry validation errors
+                    "processing_time_seconds": time.time() - start_time
+                }
+
+            # Resource errors → fail job, can retry later
+            elif error_type == "resource_error":
+                logger.error(f"❌ Speaker service resource error: {error_message}")
+                return {
+                    "success": False,
+                    "conversation_id": conversation_id,
+                    "version_id": version_id,
+                    "error": f"Resource error: {error_message}",
+                    "error_type": error_type,
+                    "retryable": True,  # Can retry later when resources available
+                    "processing_time_seconds": time.time() - start_time
+                }
+
+            # Unknown errors → fail job
+            else:
+                return {
+                    "success": False,
+                    "conversation_id": conversation_id,
+                    "version_id": version_id,
+                    "error": f"Speaker recognition failed: {error_type}",
+                    "error_details": error_message,
+                    "error_type": error_type,
+                    "processing_time_seconds": time.time() - start_time
+                }
 
         # Service worked but found no segments (legitimate empty result)
         if not speaker_result or "segments" not in speaker_result or not speaker_result["segments"]:
@@ -443,6 +471,30 @@ async def recognise_speakers_job(
             "processing_time_seconds": processing_time
         }
 
+    except asyncio.TimeoutError as e:
+        logger.error(f"❌ Speaker recognition timeout: {e}")
+
+        # Add timeout metadata to job
+        from rq import get_current_job
+        current_job = get_current_job()
+        if current_job:
+            current_job.meta.update({
+                "error_type": "timeout",
+                "audio_duration": conversation.audio_total_duration if conversation else None,
+                "timeout_occurred_at": time.time()
+            })
+            current_job.save_meta()
+
+        return {
+            "success": False,
+            "conversation_id": conversation_id,
+            "version_id": version_id,
+            "error": "Speaker recognition timeout",
+            "error_type": "timeout",
+            "audio_duration": conversation.audio_total_duration if conversation else None,
+            "processing_time_seconds": time.time() - start_time
+        }
+
     except Exception as speaker_error:
         logger.error(f"❌ Speaker recognition failed: {speaker_error}")
         import traceback
diff --git a/backends/advanced/webui/src/pages/Conversations.tsx b/backends/advanced/webui/src/pages/Conversations.tsx
index 4f3e1b2e..ca613702 100644
--- a/backends/advanced/webui/src/pages/Conversations.tsx
+++ b/backends/advanced/webui/src/pages/Conversations.tsx
@@ -68,6 +68,7 @@ export default function Conversations() {
   const [openDropdown, setOpenDropdown] = useState<string | null>(null)
   const [reprocessingTranscript, setReprocessingTranscript] = useState<Set<string>>(new Set())
   const [reprocessingMemory, setReprocessingMemory] = useState<Set<string>>(new Set())
+  const [reprocessingSpeakers, setReprocessingSpeakers] = useState<Set<string>>(new Set())
   const [deletingConversation, setDeletingConversation] = useState<Set<string>>(new Set())
 
   // Transcript segment editing state
@@ -246,6 +247,40 @@ export default function Conversations() {
     }
   }
 
+  const handleReprocessSpeakers = async (conversation: Conversation) => {
+    try {
+      if (!conversation.conversation_id) {
+        setError('Cannot reprocess speakers: Conversation ID is missing. This conversation may be from an older format.')
+        return
+      }
+
+      setReprocessingSpeakers(prev => new Set(prev).add(conversation.conversation_id!))
+      setOpenDropdown(null)
+
+      const response = await conversationsApi.reprocessSpeakers(
+        conversation.conversation_id,
+        'active'  // Use active transcript version as source
+      )
+
+      if (response.status === 200) {
+        // Refresh conversations to show new version with updated speakers
+        await loadConversations()
+      } else {
+        setError(`Failed to start speaker reprocessing: ${response.data?.error || 'Unknown error'}`)
+      }
+    } catch (err: any) {
+      setError(`Error starting speaker reprocessing: ${err.message || 'Unknown error'}`)
+    } finally {
+      if (conversation.conversation_id) {
+        setReprocessingSpeakers(prev => {
+          const newSet = new Set(prev)
+          newSet.delete(conversation.conversation_id!)
+          return newSet
+        })
+      }
+    }
+  }
+
   const handleDeleteConversation = async (conversationId: string) => {
     try {
       const confirmed = window.confirm('Are you sure you want to delete this conversation? This action cannot be undone.')
@@ -695,6 +730,22 @@ export default function Conversations() {
                           <span className="text-xs text-red-500 ml-1">(ID missing)</span>
                         )}
                       </button>
+                      <button
+                        onClick={() => handleReprocessSpeakers(conversation)}
+                        disabled={!conversation.conversation_id || reprocessingSpeakers.has(conversation.conversation_id)}
+                        className="w-full text-left px-4 py-2 text-sm text-gray-700 dark:text-gray-300 hover:bg-gray-100 dark:hover:bg-gray-700 flex items-center space-x-2 disabled:opacity-50 disabled:cursor-not-allowed"
+                        title="Create new transcript version with re-identified speakers (automatically updates memories)"
+                      >
+                        {conversation.conversation_id && reprocessingSpeakers.has(conversation.conversation_id) ? (
+                          <RefreshCw className="h-4 w-4 animate-spin" />
+                        ) : (
+                          <User className="h-4 w-4" />
+                        )}
+                        <span>Reprocess Who Spoke</span>
+                        {!conversation.conversation_id && (
+                          <span className="text-xs text-red-500 ml-1">(ID missing)</span>
+                        )}
+                      </button>
                       <div className="border-t border-gray-200 dark:border-gray-600 my-1"></div>
                       <button
                         onClick={() => conversation.conversation_id && handleDeleteConversation(conversation.conversation_id)}
diff --git a/backends/advanced/webui/src/pages/Memories.tsx b/backends/advanced/webui/src/pages/Memories.tsx
index 9c488e85..77daca51 100644
--- a/backends/advanced/webui/src/pages/Memories.tsx
+++ b/backends/advanced/webui/src/pages/Memories.tsx
@@ -24,7 +24,6 @@ export default function Memories() {
   const [loading, setLoading] = useState(false)
   const [error, setError] = useState<string | null>(null)
   const [searchQuery, setSearchQuery] = useState('')
-  const [showUnfiltered, setShowUnfiltered] = useState(false)
   const [totalCount, setTotalCount] = useState<number | null>(null)
 
   // Semantic search state
@@ -61,9 +60,7 @@ export default function Memories() {
 
     try {
       setLoading(true)
-      const response = showUnfiltered
-        ? await memoriesApi.getUnfiltered(user.id)
-        : await memoriesApi.getAll(user.id)
+      const response = await memoriesApi.getAll(user.id)
 
       console.log('🧠 Memories API response:', response.data)
 
@@ -97,7 +94,7 @@ export default function Memories() {
 
   useEffect(() => {
     loadMemories()
-  }, [user?.id, showUnfiltered])
+  }, [user?.id])
 
   // Semantic search handlers
   const handleSemanticSearch = async () => {
@@ -272,18 +269,7 @@ export default function Memories() {
 
       {/* Controls */}
       <div className="space-y-4 mb-6">
-        <div className="flex items-center justify-between">
-          <div className="flex items-center space-x-4">
-            <label className="flex items-center space-x-2 text-sm">
-              <input
-                type="checkbox"
-                checked={showUnfiltered}
-                onChange={(e) => setShowUnfiltered(e.target.checked)}
-                className="rounded border-gray-300"
-              />
-              <span className="text-gray-700 dark:text-gray-300">Show unfiltered</span>
-            </label>
-          </div>
+        <div className="flex items-center justify-end">
           <button
             onClick={loadMemories}
             disabled={loading || !user}
@@ -415,9 +401,9 @@ export default function Memories() {
                 )
               ) : (
                 totalCount !== null ? (
-                  `Showing ${memories.length} of ${totalCount} ${showUnfiltered ? 'unfiltered' : 'filtered'} memories`
+                  `Showing ${memories.length} of ${totalCount} memories`
                 ) : (
-                  `Showing ${showUnfiltered ? 'unfiltered' : 'filtered'} memories (${memories.length} found)`
+                  `Showing ${memories.length} memories`
                 )
               )}
             </p>
diff --git a/backends/advanced/webui/src/services/api.ts b/backends/advanced/webui/src/services/api.ts
index 88ce8f58..4264e9e0 100644
--- a/backends/advanced/webui/src/services/api.ts
+++ b/backends/advanced/webui/src/services/api.ts
@@ -122,6 +122,15 @@ export const conversationsApi = {
   reprocessMemory: (conversationId: string, transcriptVersionId: string = 'active') => api.post(`/api/conversations/${conversationId}/reprocess-memory`, null, {
     params: { transcript_version_id: transcriptVersionId }
   }),
+  reprocessSpeakers: (
+    conversationId: string,
+    transcriptVersionId: string = 'active'
+  ) =>
+    api.post(`/api/conversations/${conversationId}/reprocess-speakers`, null, {
+      params: {
+        transcript_version_id: transcriptVersionId
+      }
+    }),
 
   // Version management
   activateTranscriptVersion: (conversationId: string, versionId: string) => api.post(`/api/conversations/${conversationId}/activate-transcript/${versionId}`),
@@ -132,7 +141,6 @@ export const conversationsApi = {
 export const memoriesApi = {
   getAll: (userId?: string) => api.get('/api/memories', { params: userId ? { user_id: userId } : {} }),
   getById: (id: string, userId?: string) => api.get(`/api/memories/${id}`, { params: userId ? { user_id: userId } : {} }),
-  getUnfiltered: (userId?: string) => api.get('/api/memories/unfiltered', { params: userId ? { user_id: userId } : {} }),
   search: (query: string, userId?: string, limit: number = 20, scoreThreshold?: number) =>
     api.get('/api/memories/search', {
       params: {
diff --git a/extras/speaker-recognition/.env.template b/extras/speaker-recognition/.env.template
index 8c9404a7..60c7cc15 100644
--- a/extras/speaker-recognition/.env.template
+++ b/extras/speaker-recognition/.env.template
@@ -27,3 +27,19 @@ DEEPGRAM_API_KEY=
 
 # Groq API key (for LLM features)
 GROQ_API_KEY=
+
+# ========================================
+# Service Configuration (auto-configured by wizard)
+# ========================================
+
+# PyTorch CUDA version (cpu for CPU-only, cu126/cu121/cu118 for GPU)
+# PYTORCH_CUDA_VERSION=cpu
+
+# Service binding configuration
+# SPEAKER_SERVICE_HOST=0.0.0.0
+# SPEAKER_SERVICE_PORT=8085
+
+# React UI configuration
+# REACT_UI_HOST=0.0.0.0
+# REACT_UI_PORT=5174
+# REACT_UI_HTTPS=false
diff --git a/extras/speaker-recognition/init.py b/extras/speaker-recognition/init.py
index b69e04ee..649238a9 100755
--- a/extras/speaker-recognition/init.py
+++ b/extras/speaker-recognition/init.py
@@ -209,9 +209,7 @@ def setup_compute_mode(self):
             choice = self.prompt_choice("Choose compute mode:", choices, "1")
             compute_mode = "gpu" if choice == "2" else "cpu"
 
-        self.config["COMPUTE_MODE"] = compute_mode
-
-        # Set PYTORCH_CUDA_VERSION for Docker build
+        # Set PYTORCH_CUDA_VERSION for Docker build (profile determined from this)
         if compute_mode == "cpu":
             self.config["PYTORCH_CUDA_VERSION"] = "cpu"
         else:
@@ -250,6 +248,11 @@ def setup_compute_mode(self):
 
         self.console.print(f"[blue][INFO][/blue] Using {compute_mode.upper()} mode with PyTorch CUDA version: {self.config['PYTORCH_CUDA_VERSION']}")
 
+        # Set service host and port defaults
+        self.config["SPEAKER_SERVICE_HOST"] = "0.0.0.0"
+        self.config["SPEAKER_SERVICE_PORT"] = "8085"
+        self.config["REACT_UI_HOST"] = "0.0.0.0"
+
     def setup_deepgram(self):
         """Configure Deepgram API key if provided"""
         # Only set if provided via command line
@@ -373,7 +376,9 @@ def show_summary(self):
         self.console.print()
 
         self.console.print(f"✅ HF Token: {'Configured' if self.config.get('HF_TOKEN') else 'Not configured'}")
-        self.console.print(f"✅ Compute Mode: {self.config.get('COMPUTE_MODE', 'Not configured')}")
+        pytorch_version = self.config.get('PYTORCH_CUDA_VERSION', 'cpu')
+        compute_mode = 'GPU' if pytorch_version.startswith('cu') else 'CPU'
+        self.console.print(f"✅ Compute Mode: {compute_mode} ({pytorch_version})")
         self.console.print(f"✅ HTTPS Enabled: {self.config.get('REACT_UI_HTTPS', 'false')}")
         if self.config.get('DEEPGRAM_API_KEY'):
             self.console.print(f"✅ Deepgram API Key: Configured")
diff --git a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
index 9e5e48cf..15a6ef7f 100644
--- a/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
+++ b/extras/speaker-recognition/src/simple_speaker_recognition/api/routers/identification.py
@@ -97,9 +97,46 @@ async def diarize_and_identify(
     log.info("Processing diarize-and-identify request")
     log.info(f"Parameters - min_duration: {min_duration}, similarity_threshold: {similarity_threshold}, identify_only_enrolled: {identify_only_enrolled}, user_id: {user_id}, min_speakers: {min_speakers}, max_speakers: {max_speakers}, collar: {collar}, min_duration_off: {min_duration_off}")
     log.info(f"File - name: {file.filename}, content_type: {file.content_type}, size: {file.size if hasattr(file, 'size') else 'unknown'}")
-    
+
+    # Early validation: Validate file presence
+    if not file or not file.filename:
+        log.error("❌ VALIDATION ERROR: No audio file provided")
+        raise HTTPException(
+            400,
+            detail={
+                "error": "validation_error",
+                "message": "No audio file provided",
+                "field": "file"
+            }
+        )
+
     # Read audio data once
     audio_data = await file.read()
+
+    # Early validation: Validate non-empty
+    if len(audio_data) == 0:
+        log.error("❌ VALIDATION ERROR: Audio file is empty")
+        raise HTTPException(
+            400,
+            detail={
+                "error": "validation_error",
+                "message": "Audio file is empty",
+                "field": "file"
+            }
+        )
+
+    # Resource check - verify backend is initialized
+    audio_backend = get_audio_backend()
+    if not audio_backend:
+        log.error("❌ RESOURCE ERROR: Audio backend not initialized")
+        raise HTTPException(
+            503,
+            detail={
+                "error": "resource_error",
+                "message": "Audio backend not initialized",
+                "resource": "audio_backend"
+            }
+        )
     
     # Save to temp file for processing
     with secure_temp_file() as tmp:
@@ -121,9 +158,9 @@ async def diarize_and_identify(
         log.info(f"Step 1: Performing speaker diarization on {tmp_path}")
         if min_speakers or max_speakers:
             log.info(f"Using speaker constraints: min={min_speakers}, max={max_speakers}")
-        
-        audio_backend = get_audio_backend()
-        segments = await audio_backend.async_diarize(tmp_path, min_speakers=min_speakers, max_speakers=max_speakers, 
+
+        # Use audio_backend from early validation (already checked above)
+        segments = await audio_backend.async_diarize(tmp_path, min_speakers=min_speakers, max_speakers=max_speakers,
                                                      collar=collar, min_duration_off=min_duration_off)
         
         # Log what PyAnnote produced
@@ -316,19 +353,46 @@ async def diarize_identify_match(
     if conversation_id and not backend_token:
         raise HTTPException(400, "backend_token required when using conversation_id")
 
-    # Parse transcript data
+    # Early validation: Parse transcript_data FIRST (fail fast if invalid)
     try:
         transcript = json.loads(transcript_data)
         words = transcript.get("words", [])
     except json.JSONDecodeError as e:
         error_msg = f"Invalid transcript_data JSON: {str(e)}"
-        log.error(f"❌ {error_msg}")
-        raise HTTPException(400, error_msg) from e
+        log.error(f"❌ VALIDATION ERROR: {error_msg}")
+        raise HTTPException(
+            400,
+            detail={
+                "error": "validation_error",
+                "message": error_msg,
+                "field": "transcript_data"
+            }
+        ) from e
 
     if not words:
         error_msg = f"No words found in transcript_data (transcript keys: {list(transcript.keys())}, words type: {type(words)})"
-        log.error(f"❌ {error_msg}")
-        raise HTTPException(400, error_msg)
+        log.error(f"❌ VALIDATION ERROR: {error_msg}")
+        raise HTTPException(
+            400,
+            detail={
+                "error": "validation_error",
+                "message": error_msg,
+                "field": "transcript_data.words"
+            }
+        )
+
+    # Resource check - verify model is loaded before processing
+    audio_backend = get_audio_backend()
+    if not audio_backend or not hasattr(audio_backend, 'async_diarize'):
+        log.error("❌ RESOURCE ERROR: Diarization model not loaded")
+        raise HTTPException(
+            503,
+            detail={
+                "error": "resource_error",
+                "message": "Diarization model not loaded",
+                "resource": "diarization_model"
+            }
+        )
 
     # Get settings for chunking configuration
     from simple_speaker_recognition.api.service import auth as settings
@@ -395,7 +459,7 @@ async def diarize_identify_match(
         if min_speakers or max_speakers:
             log.info(f"Using speaker constraints: min={min_speakers}, max={max_speakers}")
 
-        audio_backend = get_audio_backend()
+        # Use audio_backend from early validation (already checked above)
         diarization_segments = await audio_backend.async_diarize(
             tmp_path,
             min_speakers=min_speakers,