chore: fix tracing for text chat mode

2026-06-25 08:48:13 +02:00 · 2026-05-21 12:30:56 +05:30 · 2026-05-21 12:30:56 +05:30 · 08a2435ba5
commit 08a2435ba5
parent e23cce444f
31 changed files with 1753 additions and 597 deletions
--- a/api/services/pipecat/in_memory_buffers.py
+++ b/api/services/pipecat/in_memory_buffers.py
@ -6,6 +6,10 @@ from typing import List, Optional

 from loguru import logger

+from api.services.pipecat.realtime_feedback_events import (
+    realtime_feedback_event_sort_key,
+    stamp_realtime_feedback_event,
+)
 from api.utils.transcript import generate_transcript_text as _generate_transcript_text
 from pipecat.utils.enums import RealtimeFeedbackType

@ -98,16 +102,13 @@ class InMemoryLogsBuffer:

    async def append(self, event: dict):
        """Append a feedback event to the buffer with timestamp and current node."""
-        # Add timestamp, turn tracking, and current node
-        timestamped_event = {
-            **event,
-            "timestamp": datetime.now(UTC).isoformat(),
-            "turn": self._turn_counter,
-        }
-        if self._current_node_id:
-            timestamped_event["node_id"] = self._current_node_id
-        if self._current_node_name:
-            timestamped_event["node_name"] = self._current_node_name
+        timestamped_event = stamp_realtime_feedback_event(
+            event,
+            timestamp=datetime.now(UTC).isoformat(),
+            turn=self._turn_counter,
+            node_id=self._current_node_id,
+            node_name=self._current_node_name,
+        )
        self._events.append(timestamped_event)
        logger.trace(
            f"Appended event {event.get('type')} to logs buffer for workflow {self._workflow_run_id}"
@ -120,17 +121,12 @@ class InMemoryLogsBuffer:
            f"Incremented turn counter to {self._turn_counter} for workflow {self._workflow_run_id}"
        )

-    @staticmethod
-    def _event_sort_key(event: dict) -> str:
-        payload_ts = event.get("payload", {}).get("timestamp")
-        return payload_ts or event.get("timestamp", "")
-
    def _sorted_events(self) -> List[dict]:
        # Stable sort by the realtime (payload) timestamp when available, falling
        # back to the buffer-append timestamp. Python's sort is stable, so events
        # sharing a key retain their original insertion order — this keeps
        # consecutive bot-text chunks of a single turn contiguous.
-        return sorted(self._events, key=self._event_sort_key)
+        return sorted(self._events, key=realtime_feedback_event_sort_key)

    def get_events(self) -> List[dict]:
        """Get all events for final storage, ordered by realtime timestamp."""
--- a/api/services/pipecat/pipeline_builder.py
+++ b/api/services/pipecat/pipeline_builder.py
@ -152,8 +152,30 @@ def build_realtime_pipeline(
    return Pipeline(processors)


-def create_pipeline_task(pipeline, workflow_run_id, audio_config: AudioConfig = None):
-    """Create a pipeline task with appropriate parameters"""
+def create_pipeline_task(
+    pipeline,
+    workflow_run_id,
+    audio_config: AudioConfig = None,
+    *,
+    conversation_parent_context=None,
+    conversation_type: str = "voice",
+    additional_span_attributes: dict | None = None,
+):
+    """Create a pipeline task with appropriate parameters.
+
+    Args:
+        pipeline: The pipeline to run.
+        workflow_run_id: Run id, used as the conversation id.
+        audio_config: Optional audio configuration.
+        conversation_parent_context: Optional OTEL context carrying a fixed
+            trace id. When provided, the conversation span attaches to that
+            trace instead of starting a new root trace (used by text chat to
+            stitch every per-turn pipeline into one trace).
+        conversation_type: ``conversation.type`` span attribute value.
+        additional_span_attributes: Extra attributes set on the conversation
+            span (e.g. ``langfuse.trace.name`` to name a stitched trace that
+            has no real root span).
+    """
    # Set up pipeline params with audio configuration if provided
    pipeline_params = PipelineParams(
        enable_metrics=True,
@ -178,6 +200,9 @@ def create_pipeline_task(pipeline, workflow_run_id, audio_config: AudioConfig =
        enable_tracing=True,
        enable_rtvi=False,
        conversation_id=f"{workflow_run_id}",
+        conversation_parent_context=conversation_parent_context,
+        conversation_type=conversation_type,
+        additional_span_attributes=additional_span_attributes,
    )

    # Check if turn logging is enabled
--- a/api/services/pipecat/realtime_feedback_events.py
+++ b/api/services/pipecat/realtime_feedback_events.py
@ -0,0 +1,159 @@
+"""Shared helpers for building and ordering realtime feedback events."""
+
+from typing import Any
+
+from pipecat.utils.enums import RealtimeFeedbackType
+
+
+def build_node_transition_event(
+    *,
+    node_id: str | None,
+    node_name: str | None,
+    previous_node_id: str | None,
+    previous_node_name: str | None,
+    allow_interrupt: bool = False,
+) -> dict[str, Any]:
+    return {
+        "type": RealtimeFeedbackType.NODE_TRANSITION.value,
+        "payload": {
+            "node_id": node_id,
+            "node_name": node_name,
+            "previous_node_id": previous_node_id,
+            "previous_node_name": previous_node_name,
+            "allow_interrupt": allow_interrupt,
+        },
+    }
+
+
+def build_user_transcription_event(
+    *,
+    text: str,
+    final: bool,
+    timestamp: str | None = None,
+    user_id: str | None = None,
+) -> dict[str, Any]:
+    payload: dict[str, Any] = {
+        "text": text,
+        "final": final,
+    }
+    if timestamp is not None:
+        payload["timestamp"] = timestamp
+    if user_id is not None:
+        payload["user_id"] = user_id
+    return {
+        "type": RealtimeFeedbackType.USER_TRANSCRIPTION.value,
+        "payload": payload,
+    }
+
+
+def build_bot_text_event(
+    *,
+    text: str,
+    timestamp: str | None = None,
+) -> dict[str, Any]:
+    payload: dict[str, Any] = {"text": text}
+    if timestamp is not None:
+        payload["timestamp"] = timestamp
+    return {
+        "type": RealtimeFeedbackType.BOT_TEXT.value,
+        "payload": payload,
+    }
+
+
+def build_function_call_start_event(
+    *,
+    function_name: str | None,
+    tool_call_id: str | None,
+) -> dict[str, Any]:
+    return {
+        "type": RealtimeFeedbackType.FUNCTION_CALL_START.value,
+        "payload": {
+            "function_name": function_name,
+            "tool_call_id": tool_call_id,
+        },
+    }
+
+
+def serialize_realtime_feedback_tool_result(result: Any) -> str | None:
+    """Normalize function-call results to the string shape stored in logs."""
+    if result is None:
+        return None
+    return str(result)
+
+
+def build_function_call_end_event(
+    *,
+    function_name: str | None,
+    tool_call_id: str | None,
+    result: Any,
+) -> dict[str, Any]:
+    return {
+        "type": RealtimeFeedbackType.FUNCTION_CALL_END.value,
+        "payload": {
+            "function_name": function_name,
+            "tool_call_id": tool_call_id,
+            "result": serialize_realtime_feedback_tool_result(result),
+        },
+    }
+
+
+def build_ttfb_metric_event(
+    *,
+    ttfb_seconds: float,
+    processor: str | None,
+    model: str | None,
+) -> dict[str, Any]:
+    return {
+        "type": RealtimeFeedbackType.TTFB_METRIC.value,
+        "payload": {
+            "ttfb_seconds": ttfb_seconds,
+            "processor": processor,
+            "model": model,
+        },
+    }
+
+
+def build_pipeline_error_event(
+    *,
+    error: str,
+    fatal: bool,
+    processor: str | None = None,
+    extra_payload: dict[str, Any] | None = None,
+) -> dict[str, Any]:
+    payload: dict[str, Any] = {
+        "error": error,
+        "fatal": fatal,
+    }
+    if processor is not None:
+        payload["processor"] = processor
+    if extra_payload:
+        payload.update(extra_payload)
+    return {
+        "type": RealtimeFeedbackType.PIPELINE_ERROR.value,
+        "payload": payload,
+    }
+
+
+def stamp_realtime_feedback_event(
+    event: dict[str, Any],
+    *,
+    timestamp: str | None = None,
+    turn: int | None = None,
+    node_id: str | None = None,
+    node_name: str | None = None,
+) -> dict[str, Any]:
+    stamped = dict(event)
+    if timestamp is not None:
+        stamped["timestamp"] = timestamp
+    if turn is not None:
+        stamped["turn"] = turn
+    if node_id is not None:
+        stamped["node_id"] = node_id
+    if node_name is not None:
+        stamped["node_name"] = node_name
+    return stamped
+
+
+def realtime_feedback_event_sort_key(event: dict[str, Any]) -> str:
+    payload_timestamp = (event.get("payload") or {}).get("timestamp")
+    return payload_timestamp or event.get("timestamp") or ""
--- a/api/services/pipecat/realtime_feedback_observer.py
+++ b/api/services/pipecat/realtime_feedback_observer.py
@ -27,6 +27,15 @@ from typing import TYPE_CHECKING, Awaitable, Callable, Optional, Set

 from loguru import logger

+from api.services.pipecat.realtime_feedback_events import (
+    build_bot_text_event,
+    build_function_call_end_event,
+    build_function_call_start_event,
+    build_pipeline_error_event,
+    build_ttfb_metric_event,
+    build_user_transcription_event,
+)
+
 if TYPE_CHECKING:
    from api.services.pipecat.in_memory_buffers import InMemoryLogsBuffer

@ -211,29 +220,23 @@ class RealtimeFeedbackObserver(BaseObserver):
        # Handle user transcriptions (interim) - WebSocket only
        elif isinstance(frame, InterimTranscriptionFrame):
            await self._send_ws(
-                {
-                    "type": RealtimeFeedbackType.USER_TRANSCRIPTION.value,
-                    "payload": {
-                        "text": frame.text,
-                        "final": False,
-                        "user_id": frame.user_id,
-                        "timestamp": frame.timestamp,
-                    },
-                }
+                build_user_transcription_event(
+                    text=frame.text,
+                    final=False,
+                    user_id=frame.user_id,
+                    timestamp=frame.timestamp,
+                )
            )
        # Handle user transcriptions (final) - WebSocket only
        # Complete turn text is persisted via register_turn_handlers
        elif isinstance(frame, TranscriptionFrame):
            await self._send_ws(
-                {
-                    "type": RealtimeFeedbackType.USER_TRANSCRIPTION.value,
-                    "payload": {
-                        "text": frame.text,
-                        "final": True,
-                        "user_id": frame.user_id,
-                        "timestamp": frame.timestamp,
-                    },
-                }
+                build_user_transcription_event(
+                    text=frame.text,
+                    final=True,
+                    user_id=frame.user_id,
+                    timestamp=frame.timestamp,
+                )
            )
        # Handle engine-queued speech (transition/tool messages) marked for
        # log persistence. The downstream TTSTextFrame(s) from the TTS service
@ -241,23 +244,13 @@ class RealtimeFeedbackObserver(BaseObserver):
        # to avoid word-level log entries from word-timestamp providers.
        elif isinstance(frame, TTSSpeakFrame):
            if getattr(frame, "persist_to_logs", False):
-                await self._append_to_buffer(
-                    {
-                        "type": RealtimeFeedbackType.BOT_TEXT.value,
-                        "payload": {"text": frame.text},
-                    }
-                )
+                await self._append_to_buffer(build_bot_text_event(text=frame.text))
        # Handle bot TTS text - respect pts timing, WebSocket only
        # Complete turn text is persisted via register_turn_handlers,
        # except for frames explicitly flagged persist_to_logs (e.g. recording
        # transcripts from play_audio) which bypass the aggregator path.
        elif isinstance(frame, TTSTextFrame):
-            message = {
-                "type": RealtimeFeedbackType.BOT_TEXT.value,
-                "payload": {
-                    "text": frame.text,
-                },
-            }
+            message = build_bot_text_event(text=frame.text)

            # If frame has pts, queue it for timed delivery
            if frame.pts:
@ -280,13 +273,10 @@ class RealtimeFeedbackObserver(BaseObserver):
            and frame_direction == FrameDirection.DOWNSTREAM
        ):
            await self._send_message(
-                {
-                    "type": RealtimeFeedbackType.FUNCTION_CALL_START.value,
-                    "payload": {
-                        "function_name": frame.function_name,
-                        "tool_call_id": frame.tool_call_id,
-                    },
-                }
+                build_function_call_start_event(
+                    function_name=frame.function_name,
+                    tool_call_id=frame.tool_call_id,
+                )
            )
        # Handle function call result
        elif (
@ -294,14 +284,11 @@ class RealtimeFeedbackObserver(BaseObserver):
            and frame_direction == FrameDirection.DOWNSTREAM
        ):
            await self._send_message(
-                {
-                    "type": RealtimeFeedbackType.FUNCTION_CALL_END.value,
-                    "payload": {
-                        "function_name": frame.function_name,
-                        "tool_call_id": frame.tool_call_id,
-                        "result": str(frame.result) if frame.result else None,
-                    },
-                }
+                build_function_call_end_event(
+                    function_name=frame.function_name,
+                    tool_call_id=frame.tool_call_id,
+                    result=frame.result,
+                )
            )
        # Handle TTFB metrics - capture LLM generation time only
        elif isinstance(frame, MetricsFrame):
@ -311,47 +298,42 @@ class RealtimeFeedbackObserver(BaseObserver):
                    # Only send TTFB if it's from an LLM processor
                    if metric_data.processor and "LLM" in metric_data.processor:
                        await self._send_message(
-                            {
-                                "type": RealtimeFeedbackType.TTFB_METRIC.value,
-                                "payload": {
-                                    "ttfb_seconds": metric_data.value,
-                                    "processor": metric_data.processor,
-                                    "model": metric_data.model,
-                                },
-                            }
+                            build_ttfb_metric_event(
+                                ttfb_seconds=metric_data.value,
+                                processor=metric_data.processor,
+                                model=metric_data.model,
+                            )
                        )
        # Handle pipeline errors
        elif isinstance(frame, ErrorFrame):
            processor_name = str(frame.processor) if frame.processor else None
-            payload = {
-                "error": frame.error,
-                "fatal": frame.fatal,
-                "processor": processor_name,
-            }
+            extra_payload: dict[str, object] = {}
            # Surface structured fields when the underlying exception carries
            # them (e.g. google.genai APIError: code=1008, status=None,
            # message="Your project has been denied access...").
            exc = frame.exception
            if exc is not None:
                exc_type = type(exc).__name__
-                payload["exception_type"] = exc_type
-                payload["exception_message"] = str(exc)
+                extra_payload["exception_type"] = exc_type
+                extra_payload["exception_message"] = str(exc)
                for attr in ("code", "status", "message", "details"):
                    value = getattr(exc, attr, None)
-                    if value is None or attr in payload:
+                    if value is None or attr in extra_payload:
                        continue
                    try:
                        # Ensure the value is JSON-serializable; fall back
                        # to str() for opaque objects (e.g. raw response).
                        json.dumps(value)
-                        payload[attr] = value
+                        extra_payload[attr] = value
                    except (TypeError, ValueError):
-                        payload[attr] = str(value)
+                        extra_payload[attr] = str(value)
            await self._send_message(
-                {
-                    "type": RealtimeFeedbackType.PIPELINE_ERROR.value,
-                    "payload": payload,
-                }
+                build_pipeline_error_event(
+                    error=frame.error,
+                    fatal=frame.fatal,
+                    processor=processor_name,
+                    extra_payload=extra_payload or None,
+                )
            )

    async def _send_ws(self, message: dict):
@ -401,14 +383,11 @@ def register_turn_log_handlers(
        logs_buffer.increment_turn()
        try:
            await logs_buffer.append(
-                {
-                    "type": RealtimeFeedbackType.USER_TRANSCRIPTION.value,
-                    "payload": {
-                        "text": message.content,
-                        "final": True,
-                        "timestamp": message.timestamp,
-                    },
-                }
+                build_user_transcription_event(
+                    text=message.content,
+                    final=True,
+                    timestamp=message.timestamp,
+                )
            )
        except Exception as e:
            logger.error(f"Failed to append user turn to logs buffer: {e}")
@ -418,13 +397,10 @@ def register_turn_log_handlers(
        if message.content:
            try:
                await logs_buffer.append(
-                    {
-                        "type": RealtimeFeedbackType.BOT_TEXT.value,
-                        "payload": {
-                            "text": message.content,
-                            "timestamp": message.timestamp,
-                        },
-                    }
+                    build_bot_text_event(
+                        text=message.content,
+                        timestamp=message.timestamp,
+                    )
                )
            except Exception as e:
                logger.error(f"Failed to append assistant turn to logs buffer: {e}")
--- a/api/services/pipecat/run_pipeline.py
+++ b/api/services/pipecat/run_pipeline.py
@ -28,6 +28,9 @@ from api.services.pipecat.pipeline_engine_callbacks_processor import (
 )
 from api.services.pipecat.pipeline_metrics_aggregator import PipelineMetricsAggregator
 from api.services.pipecat.pre_call_fetch import execute_pre_call_fetch
+from api.services.pipecat.realtime_feedback_events import (
+    build_node_transition_event,
+)
 from api.services.pipecat.realtime_feedback_observer import (
    RealtimeFeedbackObserver,
    register_turn_log_handlers,
@ -465,16 +468,13 @@ async def _run_pipeline(
        # Update current node on the buffer so subsequent events are tagged
        in_memory_logs_buffer.set_current_node(node_id, node_name)

-        message = {
-            "type": RealtimeFeedbackType.NODE_TRANSITION.value,
-            "payload": {
-                "node_id": node_id,
-                "node_name": node_name,
-                "previous_node_id": previous_node_id,
-                "previous_node_name": previous_node_name,
-                "allow_interrupt": allow_interrupt,
-            },
-        }
+        message = build_node_transition_event(
+            node_id=node_id,
+            node_name=node_name,
+            previous_node_id=previous_node_id,
+            previous_node_name=previous_node_name,
+            allow_interrupt=allow_interrupt,
+        )
        # Send via WebSocket if available
        if ws_sender:
            try:
--- a/api/services/pipecat/tracing_config.py
+++ b/api/services/pipecat/tracing_config.py
@ -254,6 +254,44 @@ async def handle_langfuse_sync(event):
        unregister_org_langfuse_credentials(org_id)


+def build_remote_parent_context(trace_id: str | None):
+    """Build an OTEL context whose active span carries ``trace_id``.
+
+    Spans started under the returned context join the Langfuse trace identified
+    by ``trace_id`` (Langfuse groups observations by trace id). The parent span
+    id is a non-existent placeholder, so spans created under it attach at the
+    trace root rather than nesting under a real parent span.
+
+    This is the shared primitive behind both post-call QA tracing and text-chat
+    trace stitching. Returns the context, or ``None`` when tracing is
+    unavailable or ``trace_id`` is missing/invalid.
+    """
+    if not trace_id:
+        return None
+    if not ensure_tracing():
+        return None
+    try:
+        from opentelemetry.trace import (
+            NonRecordingSpan,
+            SpanContext,
+            TraceFlags,
+            set_span_in_context,
+        )
+
+        parent_span_context = SpanContext(
+            trace_id=int(trace_id, 16),
+            span_id=0x1,
+            is_remote=True,
+            trace_flags=TraceFlags(0x01),
+        )
+        return set_span_in_context(NonRecordingSpan(parent_span_context))
+    except Exception as e:
+        logger.warning(
+            f"Failed to build remote parent context for trace {trace_id}: {e}"
+        )
+        return None
+
+
 def get_trace_url(trace_id: str, org_id=None) -> str | None:
    """Build a Langfuse trace URL, using org-specific host when available."""
    if org_id is None: