From 03df5595c3a8405f9fa7356f335caeecb7f737d4 Mon Sep 17 00:00:00 2001
From: Abhishek Kumar <abhishek@a6k.me>
Date: Sat, 4 Apr 2026 14:26:47 +0530
Subject: [PATCH] feat: add worker sync events

Add a worker sync event so that runtime updates made on one worker propagate to all other workers via Redis pub/sub in multi-worker deployments.
---
 api/AGENTS.md                           |  22 +--
 api/app.py                              |  20 ++-
 api/db/knowledge_base_client.py         |   1 +
 api/enums.py                            |   1 +
 api/routes/organization.py              |  22 +--
 api/services/pipecat/tracing_config.py  |  30 ++++
 api/services/worker_sync/__init__.py    |   0
 api/services/worker_sync/manager.py     | 114 ++++++++++++++
 api/services/worker_sync/protocol.py    |  48 ++++++
 api/tasks/knowledge_base_processing.py  | 189 ++++++++++++++++--------
 docs/configurations/tracing.mdx         |  22 +--
 pipecat                                 |   2 +-
 ui/AGENTS.md                            |  17 +++
 ui/src/app/files/DocumentUpload.tsx     |   2 +-
 ui/src/app/handler/[...stack]/page.tsx  |  13 --
 ui/src/app/settings/page.tsx            |  37 +++++
 ui/src/components/TelemetrySection.tsx  |  11 +-
 ui/src/components/layout/AppSidebar.tsx |   8 +
 18 files changed, 446 insertions(+), 113 deletions(-)
 create mode 100644 api/services/worker_sync/__init__.py
 create mode 100644 api/services/worker_sync/manager.py
 create mode 100644 api/services/worker_sync/protocol.py
 create mode 100644 ui/src/app/settings/page.tsx

diff --git a/api/AGENTS.md b/api/AGENTS.md
index 3db1fa9..9c7e287 100644
--- a/api/AGENTS.md
+++ b/api/AGENTS.md
@@ -20,15 +20,15 @@ api/
 
 ## Where to Find Things
 
-| Looking for... | Go to... |
-|----------------|----------|
-| API endpoints | `routes/` - each file is a router module, aggregated in `routes/main.py` |
-| Business logic | `services/` - organized by domain (telephony, workflow, campaign, etc.) |
-| Database models | `db/models.py` |
-| Database queries | `db/*_client.py` files (repository pattern) |
-| Request/response types | `schemas/` |
-| Background tasks | `tasks/` - uses ARQ for async job processing |
-| Environment config | `constants.py` |
+| Looking for...         | Go to...                                                                 |
+| ---------------------- | ------------------------------------------------------------------------ |
+| API endpoints          | `routes/` - each file is a router module, aggregated in `routes/main.py` |
+| Business logic         | `services/` - organized by domain (telephony, workflow, campaign, etc.)  |
+| Database models        | `db/models.py`                                                           |
+| Database queries       | `db/*_client.py` files (repository pattern)                              |
+| Request/response types | `schemas/`                                                               |
+| Background tasks       | `tasks/` - uses ARQ for async job processing                             |
+| Environment config     | `constants.py`                                                           |
 
 ## API Structure
 
@@ -43,6 +43,10 @@ api/
 ./scripts/migrate.sh                     # Run migrations
 ```
 
+## Cross-Worker State Sync
+
+When an API endpoint updates in-memory state (e.g. cached credentials, config objects), that change only affects the worker process that handled the request. With multiple FastAPI workers, **use `WorkerSyncManager`** (`services/worker_sync/`) to propagate changes to all workers via Redis pub/sub instead of updating local state directly.
+
 ## Development
 
 ```bash
diff --git a/api/app.py b/api/app.py
index 3538a60..1a2a7c8 100644
--- a/api/app.py
+++ b/api/app.py
@@ -26,8 +26,17 @@ from fastapi import APIRouter, FastAPI
 from fastapi.middleware.cors import CORSMiddleware
 from loguru import logger
 
+from api.constants import REDIS_URL
 from api.routes.main import router as main_router
-from api.services.pipecat.tracing_config import load_all_org_langfuse_credentials
+from api.services.pipecat.tracing_config import (
+    handle_langfuse_sync,
+    load_all_org_langfuse_credentials,
+)
+from api.services.worker_sync.manager import (
+    WorkerSyncManager,
+    set_worker_sync_manager,
+)
+from api.services.worker_sync.protocol import WorkerSyncEventType
 from api.tasks.arq import get_arq_redis
 
 API_PREFIX = "/api/v1"
@@ -42,10 +51,19 @@ async def lifespan(app: FastAPI):
     # before any pipeline runs, without per-call DB lookups.
     await load_all_org_langfuse_credentials()
 
+    # Start cross-worker sync manager so config changes propagate to all workers
+    sync_manager = WorkerSyncManager(REDIS_URL)
+    sync_manager.register(
+        WorkerSyncEventType.LANGFUSE_CREDENTIALS, handle_langfuse_sync
+    )
+    await sync_manager.start()
+    set_worker_sync_manager(sync_manager)
+
     yield  # Run app
 
     # Shutdown sequence - this runs when FastAPI is shutting down
     logger.info("Starting graceful shutdown...")
+    await sync_manager.stop()
 
 
 app = FastAPI(
diff --git a/api/db/knowledge_base_client.py b/api/db/knowledge_base_client.py
index 835b25a..bcedb16 100644
--- a/api/db/knowledge_base_client.py
+++ b/api/db/knowledge_base_client.py
@@ -493,6 +493,7 @@ class KnowledgeBaseClient(BaseDBClient):
             ".docx": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
             ".doc": "application/msword",
             ".txt": "text/plain",
+            ".json": "application/json",
             ".html": "text/html",
             ".md": "text/markdown",
         }
diff --git a/api/enums.py b/api/enums.py
index 85b6829..95d3c62 100644
--- a/api/enums.py
+++ b/api/enums.py
@@ -103,6 +103,7 @@ class RedisChannel(Enum):
     """Redis pub/sub channel names"""
 
     CAMPAIGN_EVENTS = "campaign_events"
+    WORKER_SYNC = "worker_sync"
 
 
 class TriggerState(Enum):
diff --git a/api/routes/organization.py b/api/routes/organization.py
index 088cabf..854fab1 100644
--- a/api/routes/organization.py
+++ b/api/routes/organization.py
@@ -24,7 +24,8 @@ from api.schemas.telephony_config import (
 )
 from api.services.auth.depends import get_user
 from api.services.configuration.masking import is_mask_of, mask_key
-from api.services.pipecat.tracing_config import unregister_org_langfuse_credentials
+from api.services.worker_sync.manager import get_worker_sync_manager
+from api.services.worker_sync.protocol import WorkerSyncEventType
 
 router = APIRouter(prefix="/organizations", tags=["organizations"])
 
@@ -341,14 +342,11 @@ async def save_langfuse_credentials(
         config_value,
     )
 
-    # Update the in-memory OTEL exporter so new traces route immediately
-    from api.services.pipecat.tracing_config import register_org_langfuse_credentials
-
-    register_org_langfuse_credentials(
+    # Broadcast to all workers so every process updates its in-memory exporter
+    await get_worker_sync_manager().broadcast(
+        WorkerSyncEventType.LANGFUSE_CREDENTIALS,
+        action="update",
         org_id=user.selected_organization_id,
-        host=config_value["host"],
-        public_key=config_value["public_key"],
-        secret_key=config_value["secret_key"],
     )
 
     return {"message": "Langfuse credentials saved successfully"}
@@ -368,8 +366,12 @@ async def delete_langfuse_credentials(user: UserModel = Depends(get_user)):
     if not deleted:
         raise HTTPException(status_code=404, detail="No Langfuse credentials found")
 
-    # Remove the in-memory OTEL exporter so traces fall back to default
-    unregister_org_langfuse_credentials(user.selected_organization_id)
+    # Broadcast to all workers so every process removes its in-memory exporter
+    await get_worker_sync_manager().broadcast(
+        WorkerSyncEventType.LANGFUSE_CREDENTIALS,
+        action="delete",
+        org_id=user.selected_organization_id,
+    )
 
     return {"message": "Langfuse credentials deleted successfully"}
 
diff --git a/api/services/pipecat/tracing_config.py b/api/services/pipecat/tracing_config.py
index f71ad27..e2db809 100644
--- a/api/services/pipecat/tracing_config.py
+++ b/api/services/pipecat/tracing_config.py
@@ -223,6 +223,36 @@ async def load_all_org_langfuse_credentials():
     logger.info(f"Loaded Langfuse credentials for {len(configs)} org(s)")
 
 
+async def handle_langfuse_sync(event):
+    """Worker sync handler: refresh a single org's Langfuse exporter from DB."""
+    from api.db import db_client
+    from api.enums import OrganizationConfigurationKey
+
+    org_id = event.org_id
+
+    logger.info(
+        f"handle_langfuse_sync for org_id: {event.org_id} action: {event.action}"
+    )
+
+    if event.action == "delete":
+        unregister_org_langfuse_credentials(org_id)
+        return
+
+    config = await db_client.get_configuration(
+        org_id, OrganizationConfigurationKey.LANGFUSE_CREDENTIALS.value
+    )
+    if config and config.value:
+        register_org_langfuse_credentials(
+            org_id=org_id,
+            host=config.value.get("host"),
+            public_key=config.value.get("public_key"),
+            secret_key=config.value.get("secret_key"),
+        )
+    else:
+        # Credentials were saved then deleted before we got the event
+        unregister_org_langfuse_credentials(org_id)
+
+
 def get_trace_url(trace_id: str, org_id=None) -> str | None:
     """Build a Langfuse trace URL, using org-specific host when available."""
     if org_id is None:
diff --git a/api/services/worker_sync/__init__.py b/api/services/worker_sync/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/api/services/worker_sync/manager.py b/api/services/worker_sync/manager.py
new file mode 100644
index 0000000..b0ae2a5
--- /dev/null
+++ b/api/services/worker_sync/manager.py
@@ -0,0 +1,114 @@
+"""Worker sync manager for cross-worker state propagation.
+
+Each FastAPI worker both publishes and listens on a single Redis pub/sub
+channel.  When shared state changes (e.g. Langfuse credentials), the worker
+that handled the mutation broadcasts a lightweight event.  Every worker
+(including the sender) receives it and runs the registered handler, which
+re-reads authoritative state from the DB.
+"""
+
+import asyncio
+from typing import Awaitable, Callable, Dict
+
+import redis.asyncio as aioredis
+from loguru import logger
+
+from api.enums import RedisChannel
+from api.services.worker_sync.protocol import WorkerSyncEvent
+
+SyncHandler = Callable[[WorkerSyncEvent], Awaitable[None]]
+
+
+class WorkerSyncManager:
+    """Propagates state changes across FastAPI workers via Redis pub/sub."""
+
+    def __init__(self, redis_url: str):
+        self._redis_url = redis_url
+        self._handlers: Dict[str, SyncHandler] = {}
+        self._redis: aioredis.Redis | None = None
+        self._pubsub: aioredis.client.PubSub | None = None
+        self._listener_task: asyncio.Task | None = None
+
+    def register(self, event_type: str, handler: SyncHandler):
+        """Register a handler for an event type. Call before start()."""
+        self._handlers[event_type] = handler
+        logger.info(f"Worker sync handler registered: {event_type}")
+
+    async def broadcast(self, event_type: str, action: str, org_id: str = ""):
+        """Publish an event to all workers (including self)."""
+        if not self._redis:
+            logger.warning("WorkerSyncManager not started, skipping broadcast")
+            return
+        event = WorkerSyncEvent(event_type=event_type, action=action, org_id=org_id)
+        await self._redis.publish(RedisChannel.WORKER_SYNC.value, event.to_json())
+        logger.debug(f"Broadcast worker sync: {event_type}/{action} org={org_id}")
+
+    async def start(self):
+        """Open a dedicated Redis connection and start the background listener."""
+        self._redis = await aioredis.from_url(self._redis_url, decode_responses=True)
+        self._pubsub = self._redis.pubsub()
+        await self._pubsub.subscribe(RedisChannel.WORKER_SYNC.value)
+        self._listener_task = asyncio.create_task(self._listen())
+        logger.info("WorkerSyncManager started")
+
+    async def stop(self):
+        """Cancel the listener and close the Redis connection."""
+        if self._listener_task:
+            self._listener_task.cancel()
+            try:
+                await self._listener_task
+            except asyncio.CancelledError:
+                pass
+        if self._pubsub:
+            await self._pubsub.unsubscribe(RedisChannel.WORKER_SYNC.value)
+            await self._pubsub.close()
+        if self._redis:
+            await self._redis.close()
+        logger.info("WorkerSyncManager stopped")
+
+    async def _listen(self):
+        """Background loop: receive events and dispatch to handlers."""
+        try:
+            async for message in self._pubsub.listen():
+                if message["type"] != "message":
+                    continue
+                event = WorkerSyncEvent.from_json(message["data"])
+                if not event:
+                    continue
+                handler = self._handlers.get(event.event_type)
+                if handler:
+                    try:
+                        await handler(event)
+                    except Exception:
+                        logger.exception(
+                            f"Worker sync handler error: {event.event_type}"
+                        )
+                else:
+                    logger.warning(
+                        f"No handler for worker sync event: {event.event_type}"
+                    )
+        except asyncio.CancelledError:
+            raise
+        except Exception:
+            logger.exception("Worker sync listener crashed")
+
+
+# Module-level singleton, initialized in app lifespan
+_manager: WorkerSyncManager | None = None
+
+
+def get_worker_sync_manager() -> WorkerSyncManager:
+    """Get the active WorkerSyncManager instance.
+
+    Raises RuntimeError if no manager has been installed yet via
+    set_worker_sync_manager() (the FastAPI lifespan does this at startup).
+    """
+    if _manager is None:
+        raise RuntimeError("WorkerSyncManager not initialized")
+    return _manager
+
+
+def set_worker_sync_manager(manager: WorkerSyncManager):
+    """Set the module-level singleton. Called from the app lifespan."""
+    global _manager
+    _manager = manager
diff --git a/api/services/worker_sync/protocol.py b/api/services/worker_sync/protocol.py
new file mode 100644
index 0000000..633091e
--- /dev/null
+++ b/api/services/worker_sync/protocol.py
@@ -0,0 +1,48 @@
+"""Worker sync event protocol.
+
+Defines the message format for cross-worker state synchronization via Redis pub/sub.
+"""
+
+import json
+from dataclasses import asdict, dataclass
+from enum import Enum
+from typing import Optional
+
+from loguru import logger
+
+
+class WorkerSyncEventType(str, Enum):
+    """Types of worker sync events."""
+
+    LANGFUSE_CREDENTIALS = "langfuse_credentials"
+
+
+@dataclass
+class WorkerSyncEvent:
+    """A notification that some shared state has changed.
+
+    Handlers should re-read authoritative state from the DB rather than
+    relying on fields in the event — the event is just a trigger.
+    """
+
+    event_type: str  # handler key, e.g. "langfuse_credentials"
+    action: str  # "update" or "delete"
+    org_id: str = ""
+    timestamp: Optional[str] = None
+
+    def __post_init__(self):
+        if self.timestamp is None:
+            from datetime import UTC, datetime
+
+            self.timestamp = datetime.now(UTC).isoformat()
+
+    def to_json(self) -> str:
+        return json.dumps(asdict(self))
+
+    @classmethod
+    def from_json(cls, data: str) -> Optional["WorkerSyncEvent"]:
+        try:
+            return cls(**json.loads(data))
+        except Exception as e:
+            logger.error(f"Failed to parse worker sync event: {e}, data: {data}")
+            return None
diff --git a/api/tasks/knowledge_base_processing.py b/api/tasks/knowledge_base_processing.py
index e4fbaaf..1436bd1 100644
--- a/api/tasks/knowledge_base_processing.py
+++ b/api/tasks/knowledge_base_processing.py
@@ -1,5 +1,6 @@
 """ARQ background task for processing knowledge base documents."""
 
+import json
 import os
 import tempfile
 
@@ -163,84 +164,148 @@ async def process_knowledge_base_document(
             base_url=embeddings_base_url,
         )
 
-        # Step 1: Convert document with docling
-        logger.info("Converting document with docling")
-        converter = DocumentConverter()
-        conversion_result = converter.convert(temp_file_path)
-        doc = conversion_result.document
-
-        # Store docling metadata
-        docling_metadata = {
-            "num_pages": len(doc.pages) if hasattr(doc, "pages") else None,
-            "document_type": type(doc).__name__,
-        }
-
-        # Step 2: Initialize tokenizer for chunking
+        # Step 1: Initialize tokenizer for chunking
         logger.info(
             f"Loading tokenizer: {TOKENIZER_MODEL} with max_tokens={max_tokens}"
         )
+        hf_tokenizer = AutoTokenizer.from_pretrained(TOKENIZER_MODEL)
         tokenizer = HuggingFaceTokenizer(
-            tokenizer=AutoTokenizer.from_pretrained(TOKENIZER_MODEL),
+            tokenizer=hf_tokenizer,
             max_tokens=max_tokens,
         )
 
-        # Step 3: Initialize chunker
-        logger.info(f"Initializing HybridChunker with max_tokens={max_tokens}")
-        chunker = HybridChunker(tokenizer=tokenizer)
-
-        # Step 4: Chunk the document
-        logger.info(f"Chunking document with max_tokens={max_tokens}")
-        chunks = list(chunker.chunk(dl_doc=doc))
-        total_chunks = len(chunks)
-        logger.info(f"Generated {total_chunks} chunks")
-
-        # Step 5: Process each chunk
         chunk_texts = []
         chunk_records = []
         token_counts = []
 
-        for i, chunk in enumerate(chunks):
-            chunk_text = chunk.text
-            contextualized_text = chunker.contextualize(chunk=chunk)
+        # Check if file is a plain text format that docling doesn't support
+        plain_text_extensions = {".txt", ".json"}
+        if file_extension.lower() in plain_text_extensions:
+            # Read text content directly
+            logger.info(f"Reading {file_extension} file directly (bypassing docling)")
+            with open(temp_file_path, "r", encoding="utf-8") as f:
+                raw_content = f.read()
 
-            # Calculate token count
-            text_to_tokenize = (
-                contextualized_text if contextualized_text else chunk_text
-            )
-            token_count = len(
-                tokenizer.tokenizer.encode(text_to_tokenize, add_special_tokens=False)
-            )
-            token_counts.append(token_count)
+            # For JSON files, pretty-print for better readability
+            if file_extension.lower() == ".json":
+                try:
+                    parsed = json.loads(raw_content)
+                    raw_content = json.dumps(parsed, indent=2, ensure_ascii=False)
+                except json.JSONDecodeError:
+                    logger.warning(
+                        "JSON file is not valid JSON, treating as plain text"
+                    )
 
-            # Prepare chunk metadata
-            chunk_metadata = {}
-            if hasattr(chunk, "meta") and chunk.meta:
-                chunk_metadata = {
-                    "doc_items": (
-                        [str(item) for item in chunk.meta.doc_items]
-                        if hasattr(chunk.meta, "doc_items")
-                        else []
-                    ),
-                    "headings": (
-                        chunk.meta.headings if hasattr(chunk.meta, "headings") else []
-                    ),
-                }
+            docling_metadata = {
+                "num_pages": None,
+                "document_type": "PlainText",
+            }
 
-            # Create chunk record (without embedding yet)
-            chunk_record = KnowledgeBaseChunkModel(
-                document_id=document_id,
-                organization_id=organization_id,
-                chunk_text=chunk_text,
-                contextualized_text=contextualized_text,
-                chunk_index=i,
-                chunk_metadata=chunk_metadata,
-                embedding_model=service.get_model_id(),
-                embedding_dimension=service.get_embedding_dimension(),
-                token_count=token_count,
+            # Token-based chunking for plain text
+            tokens = hf_tokenizer.encode(raw_content, add_special_tokens=False)
+            total_tokens = len(tokens)
+            logger.info(
+                f"Total tokens in file: {total_tokens}, chunking with max_tokens={max_tokens}"
             )
 
-            chunk_records.append(chunk_record)
-            chunk_texts.append(text_to_tokenize)
+            start = 0
+            chunk_index = 0
+            while start < total_tokens:
+                end = min(start + max_tokens, total_tokens)
+                chunk_token_ids = tokens[start:end]
+                chunk_text = hf_tokenizer.decode(
+                    chunk_token_ids, skip_special_tokens=True
+                )
+
+                token_count = len(chunk_token_ids)
+                token_counts.append(token_count)
+
+                chunk_record = KnowledgeBaseChunkModel(
+                    document_id=document_id,
+                    organization_id=organization_id,
+                    chunk_text=chunk_text,
+                    contextualized_text=chunk_text,
+                    chunk_index=chunk_index,
+                    chunk_metadata={},
+                    embedding_model=service.get_model_id(),
+                    embedding_dimension=service.get_embedding_dimension(),
+                    token_count=token_count,
+                )
+
+                chunk_records.append(chunk_record)
+                chunk_texts.append(chunk_text)
+                chunk_index += 1
+                start = end
+
+            total_chunks = len(chunk_records)
+            logger.info(f"Generated {total_chunks} chunks from plain text")
+
+        else:
+            # Use docling for structured formats (PDF, DOCX, etc.)
+            logger.info("Converting document with docling")
+            converter = DocumentConverter()
+            conversion_result = converter.convert(temp_file_path)
+            doc = conversion_result.document
+
+            docling_metadata = {
+                "num_pages": len(doc.pages) if hasattr(doc, "pages") else None,
+                "document_type": type(doc).__name__,
+            }
+
+            # Initialize chunker
+            logger.info(f"Initializing HybridChunker with max_tokens={max_tokens}")
+            chunker = HybridChunker(tokenizer=tokenizer)
+
+            # Chunk the document
+            logger.info(f"Chunking document with max_tokens={max_tokens}")
+            chunks = list(chunker.chunk(dl_doc=doc))
+            total_chunks = len(chunks)
+            logger.info(f"Generated {total_chunks} chunks")
+
+            # Process each chunk
+            for i, chunk in enumerate(chunks):
+                chunk_text = chunk.text
+                contextualized_text = chunker.contextualize(chunk=chunk)
+
+                text_to_tokenize = (
+                    contextualized_text if contextualized_text else chunk_text
+                )
+                token_count = len(
+                    tokenizer.tokenizer.encode(
+                        text_to_tokenize, add_special_tokens=False
+                    )
+                )
+                token_counts.append(token_count)
+
+                chunk_metadata = {}
+                if hasattr(chunk, "meta") and chunk.meta:
+                    chunk_metadata = {
+                        "doc_items": (
+                            [str(item) for item in chunk.meta.doc_items]
+                            if hasattr(chunk.meta, "doc_items")
+                            else []
+                        ),
+                        "headings": (
+                            chunk.meta.headings
+                            if hasattr(chunk.meta, "headings")
+                            else []
+                        ),
+                    }
+
+                chunk_record = KnowledgeBaseChunkModel(
+                    document_id=document_id,
+                    organization_id=organization_id,
+                    chunk_text=chunk_text,
+                    contextualized_text=contextualized_text,
+                    chunk_index=i,
+                    chunk_metadata=chunk_metadata,
+                    embedding_model=service.get_model_id(),
+                    embedding_dimension=service.get_embedding_dimension(),
+                    token_count=token_count,
+                )
+
+                chunk_records.append(chunk_record)
+                chunk_texts.append(text_to_tokenize)
 
         # Log chunk statistics
         if token_counts:
diff --git a/docs/configurations/tracing.mdx b/docs/configurations/tracing.mdx
index 17fdb46..ca57293 100644
--- a/docs/configurations/tracing.mdx
+++ b/docs/configurations/tracing.mdx
@@ -106,28 +106,22 @@ Every time an LLM call is made, the **entire conversation history up to that poi
 - You can see exactly what context the LLM had when it made a decision
 - Useful for debugging unexpected responses
 
-## Setting Up Tracing in (Open Source) Self hosted Dograh AI
+## Setting Up Langfuse Tracing
 
-### Langfuse Integration
-
-We provide seamless integration with Langfuse for self-hosted Dograh deployments.
+Dograh integrates with Langfuse so you can send traces to your own Langfuse account. This also lets you use the [playground feature of Langfuse](https://langfuse.com/docs/prompt-management/features/playground). The integration works on both managed and self-hosted Dograh deployments.
 
 **Setup steps:**
 
 1. Sign up at [Langfuse](https://langfuse.com) and create API credentials
-2. Add the following [environment variables](/developer/environment-variables#tracing-langfuse) (in `docker-compose.yaml` for Docker deployments):
-
-```
-ENABLE_TRACING="true"
-LANGFUSE_SECRET_KEY=
-LANGFUSE_PUBLIC_KEY=
-LANGFUSE_HOST=
-```
-
-3. Restart your services
+2. In the Dograh UI, go to **Platform Settings** (`/settings`) and enter your Langfuse host, public key, and secret key
+3. Click **Save**
 
 Once enabled, traces will be available for every completed call in Dograh.
 
+<Note>
+For self-hosted deployments, you can also configure Langfuse via [environment variables](/developer/environment-variables#tracing-langfuse) (`ENABLE_TRACING`, `LANGFUSE_SECRET_KEY`, `LANGFUSE_PUBLIC_KEY`, `LANGFUSE_HOST`) if you prefer. The UI settings take precedence over environment variables.
+</Note>
+
 ## Quick Reference
 
 | Trace Type | What It Shows |
diff --git a/pipecat b/pipecat
index a2dc39c..43b231d 160000
--- a/pipecat
+++ b/pipecat
@@ -1 +1 @@
-Subproject commit a2dc39c0d706e420121d045183554f378fe9d841
+Subproject commit 43b231d8a8f30d1afacda6f35d334ef0efb223be
diff --git a/ui/AGENTS.md b/ui/AGENTS.md
index e821582..83f818b 100644
--- a/ui/AGENTS.md
+++ b/ui/AGENTS.md
@@ -54,6 +54,23 @@ npm run generate-client
 
 Always use a hidden `<input type="file">` with a visible `<Button>` that triggers it via `fileInputRef.current?.click()`. Never use a visible `<Input type="file">` — the native file input styling is inconsistent and confusing. Show the selected filename next to or below the button.
 
+### Authenticated API Calls
+
+Components that make API calls must wait for auth to be ready before fetching. Use `useAuth()` and guard the `useEffect` with `authLoading` and `user`:
+
+```tsx
+const { user, loading: authLoading } = useAuth();
+const hasFetched = useRef(false);
+
+useEffect(() => {
+  if (authLoading || !user || hasFetched.current) return;
+  hasFetched.current = true;
+  fetchData();
+}, [authLoading, user]);
+```
+
+The auth interceptor (which attaches the Bearer token) is only registered once auth is fully loaded. Fetching before that sends unauthenticated requests that silently fail.
+
 ## Development
 
 ```bash
diff --git a/ui/src/app/files/DocumentUpload.tsx b/ui/src/app/files/DocumentUpload.tsx
index 4ff002d..f79bb0a 100644
--- a/ui/src/app/files/DocumentUpload.tsx
+++ b/ui/src/app/files/DocumentUpload.tsx
@@ -18,7 +18,7 @@ interface DocumentUploadProps {
 }
 
 const MAX_FILE_SIZE = 5 * 1024 * 1024; // 5MB
-const ACCEPTED_FILE_TYPES = ['.pdf', '.docx', '.doc', '.txt'];
+const ACCEPTED_FILE_TYPES = ['.pdf', '.docx', '.doc', '.txt', '.json'];
 
 export default function DocumentUpload({ onUploadSuccess }: DocumentUploadProps) {
   const [uploading, setUploading] = useState(false);
diff --git a/ui/src/app/handler/[...stack]/page.tsx b/ui/src/app/handler/[...stack]/page.tsx
index acb76b3..2ae9448 100644
--- a/ui/src/app/handler/[...stack]/page.tsx
+++ b/ui/src/app/handler/[...stack]/page.tsx
@@ -1,6 +1,5 @@
 import { StackHandler } from "@stackframe/stack";
 
-import { TelemetrySection } from "@/components/TelemetrySection";
 import { getAuthProvider } from "@/lib/auth/config";
 
 import { BackButton } from "./BackButton";
@@ -29,18 +28,6 @@ export default async function Handler(props: unknown) {
           fullPage
           app={app!}
           routeProps={props}
-          componentProps={{
-            AccountSettings: {
-              extraItems: [
-                {
-                  id: "telemetry",
-                  title: "Telemetry",
-                  iconName: "Key",
-                  content: <TelemetrySection />,
-                },
-              ],
-            },
-          }}
         />
       </div>
     </div>
diff --git a/ui/src/app/settings/page.tsx b/ui/src/app/settings/page.tsx
new file mode 100644
index 0000000..1e8c91a
--- /dev/null
+++ b/ui/src/app/settings/page.tsx
@@ -0,0 +1,37 @@
+"use client";
+
+import { TelemetrySection } from "@/components/TelemetrySection";
+import {
+  Card,
+  CardContent,
+  CardDescription,
+  CardHeader,
+  CardTitle,
+} from "@/components/ui/card";
+
+export default function SettingsPage() {
+  return (
+    <div className="flex justify-center py-12 px-4">
+      <div className="w-full max-w-2xl space-y-6">
+        <div>
+          <h1 className="text-2xl font-bold">Platform Settings</h1>
+          <p className="text-muted-foreground">
+            Manage your platform configuration and integrations.
+          </p>
+        </div>
+
+        <Card>
+          <CardHeader>
+            <CardTitle>Telemetry</CardTitle>
+            <CardDescription>
+              Configure Langfuse tracing for your voice agent calls.
+            </CardDescription>
+          </CardHeader>
+          <CardContent>
+            <TelemetrySection />
+          </CardContent>
+        </Card>
+      </div>
+    </div>
+  );
+}
diff --git a/ui/src/components/TelemetrySection.tsx b/ui/src/components/TelemetrySection.tsx
index c7e94a3..4846d82 100644
--- a/ui/src/components/TelemetrySection.tsx
+++ b/ui/src/components/TelemetrySection.tsx
@@ -1,6 +1,6 @@
 "use client";
 
-import { useEffect, useState } from "react";
+import { useEffect, useRef, useState } from "react";
 import { toast } from "sonner";
 
 import {
@@ -12,8 +12,10 @@ import type { LangfuseCredentialsResponse } from "@/client/types.gen";
 import { Button } from "@/components/ui/button";
 import { Input } from "@/components/ui/input";
 import { Label } from "@/components/ui/label";
+import { useAuth } from "@/lib/auth";
 
 export function TelemetrySection() {
+  const { user, loading: authLoading } = useAuth();
   const [credentials, setCredentials] = useState<LangfuseCredentialsResponse>({
     host: "",
     public_key: "",
@@ -22,10 +24,15 @@ export function TelemetrySection() {
   });
   const [loading, setLoading] = useState(true);
   const [saving, setSaving] = useState(false);
+  const hasFetched = useRef(false);
 
   useEffect(() => {
+    if (authLoading || !user || hasFetched.current) {
+      return;
+    }
+    hasFetched.current = true;
     fetchCredentials();
-  }, []);
+  }, [authLoading, user]);
 
   async function fetchCredentials() {
     try {
diff --git a/ui/src/components/layout/AppSidebar.tsx b/ui/src/components/layout/AppSidebar.tsx
index e59385b..6aea615 100644
--- a/ui/src/components/layout/AppSidebar.tsx
+++ b/ui/src/components/layout/AppSidebar.tsx
@@ -398,6 +398,10 @@ export function AppSidebar() {
                     </div>
                   </DropdownMenuLabel>
                   <DropdownMenuSeparator />
+                  <DropdownMenuItem onClick={() => router.push("/settings")} className="cursor-pointer">
+                    <Settings className="mr-2 h-4 w-4" />
+                    Platform Settings
+                  </DropdownMenuItem>
                   <DropdownMenuItem onClick={() => logout()} className="cursor-pointer">
                     <LogOut className="mr-2 h-4 w-4" />
                     Sign out
@@ -443,6 +447,10 @@ export function AppSidebar() {
                     <Settings className="mr-2 h-4 w-4" />
                     Account settings
                   </DropdownMenuItem>
+                  <DropdownMenuItem onClick={() => router.push("/settings")} className="cursor-pointer">
+                    <Settings className="mr-2 h-4 w-4" />
+                    Platform Settings
+                  </DropdownMenuItem>
                   <DropdownMenuItem onClick={() => router.push("/usage")} className="cursor-pointer">
                     <CircleDollarSign className="mr-2 h-4 w-4" />
                     Usage