feat: add rtf in logs

This commit is contained in:
Abhishek Kumar 2026-01-14 18:35:18 +05:30
parent a172db8022
commit d25f898a8f
10 changed files with 284 additions and 23 deletions

View file

@ -611,6 +611,7 @@ async def get_workflow_run(
"initial_context": run.initial_context,
"gathered_context": run.gathered_context,
"call_type": run.call_type,
"logs": run.logs,
}

View file

@ -20,3 +20,4 @@ class WorkflowRunResponseSchema(BaseModel):
initial_context: dict | None = None
gathered_context: dict | None = None
call_type: CallType
logs: Dict[str, Any] | None = None

View file

@ -4,8 +4,9 @@ from api.db import db_client
from api.enums import WorkflowRunState
from api.services.campaign.call_dispatcher import campaign_call_dispatcher
from api.services.pipecat.audio_config import AudioConfig
from api.services.pipecat.audio_transcript_buffers import (
from api.services.pipecat.in_memory_buffers import (
InMemoryAudioBuffer,
InMemoryLogsBuffer,
InMemoryTranscriptBuffer,
)
from api.services.pipecat.pipeline_metrics_aggregator import PipelineMetricsAggregator
@ -46,6 +47,7 @@ def register_transport_event_handlers(
num_channels=num_channels,
)
in_memory_transcript_buffer = InMemoryTranscriptBuffer(workflow_run_id)
in_memory_logs_buffer = InMemoryLogsBuffer(workflow_run_id)
@transport.event_handler("on_client_connected")
async def on_client_connected(transport, participant):
@ -69,7 +71,7 @@ def register_transport_event_handlers(
await task.cancel()
# Return the buffers so they can be passed to other handlers
return in_memory_audio_buffer, in_memory_transcript_buffer
return in_memory_audio_buffer, in_memory_transcript_buffer, in_memory_logs_buffer
def register_task_event_handler(
@ -80,6 +82,7 @@ def register_task_event_handler(
audio_buffer: AudioBufferProcessor,
in_memory_audio_buffer: InMemoryAudioBuffer,
in_memory_transcript_buffer: InMemoryTranscriptBuffer,
in_memory_logs_buffer: InMemoryLogsBuffer,
pipeline_metrics_aggregator: PipelineMetricsAggregator,
):
@task.event_handler("on_pipeline_started")
@ -185,6 +188,22 @@ def register_task_event_handler(
state=WorkflowRunState.COMPLETED.value,
)
# Save real-time feedback logs to workflow run
if not in_memory_logs_buffer.is_empty:
try:
feedback_events = in_memory_logs_buffer.get_events()
await db_client.update_workflow_run(
run_id=workflow_run_id,
logs={"realtime_feedback_events": feedback_events},
)
logger.debug(
f"Saved {len(feedback_events)} feedback events to workflow run logs"
)
except Exception as e:
logger.error(f"Error saving realtime feedback logs: {e}", exc_info=True)
else:
logger.debug("Logs buffer is empty, skipping save")
# Release concurrent slot for campaign calls
if workflow_run and workflow_run.campaign_id:
await campaign_call_dispatcher.release_call_slot(workflow_run_id)

View file

@ -2,6 +2,7 @@ import asyncio
import re
import tempfile
import wave
from datetime import UTC, datetime
from typing import List
from loguru import logger
@ -120,3 +121,41 @@ class InMemoryTranscriptBuffer:
if self._USER_SPEECH_RE.match(line):
return True
return False
class InMemoryLogsBuffer:
"""Buffer real-time feedback events in memory during a call, then save to workflow run logs."""
def __init__(self, workflow_run_id: int):
self._workflow_run_id = workflow_run_id
self._events: List[dict] = []
self._turn_counter = 0
async def append(self, event: dict):
"""Append a feedback event to the buffer with timestamp."""
# Add timestamp and turn tracking
timestamped_event = {
**event,
"timestamp": datetime.now(UTC).isoformat(),
"turn": self._turn_counter,
}
self._events.append(timestamped_event)
logger.trace(
f"Appended event {event.get('type')} to logs buffer for workflow {self._workflow_run_id}"
)
def increment_turn(self):
"""Increment turn counter (called on user transcription completion)."""
self._turn_counter += 1
logger.trace(
f"Incremented turn counter to {self._turn_counter} for workflow {self._workflow_run_id}"
)
def get_events(self) -> List[dict]:
"""Get all events for final storage."""
return self._events
@property
def is_empty(self) -> bool:
"""Check if the buffer is empty."""
return len(self._events) == 0

View file

@ -10,10 +10,13 @@ how base_output.py handles timed frames.
import asyncio
import time
from typing import Awaitable, Callable, Optional, Set
from typing import TYPE_CHECKING, Awaitable, Callable, Optional, Set
from loguru import logger
if TYPE_CHECKING:
from api.services.pipecat.in_memory_buffers import InMemoryLogsBuffer
from pipecat.frames.frames import (
CancelFrame,
EndFrame,
@ -40,14 +43,17 @@ class RealtimeFeedbackObserver(BaseObserver):
def __init__(
self,
ws_sender: Callable[[dict], Awaitable[None]],
logs_buffer: Optional["InMemoryLogsBuffer"] = None,
):
"""
Args:
ws_sender: Async function to send messages over WebSocket.
Expected signature: async def send(message: dict) -> None
logs_buffer: Optional InMemoryLogsBuffer to persist events for post-call analysis.
"""
super().__init__()
self._ws_sender = ws_sender
self._logs_buffer = logs_buffer
self._frames_seen: Set[str] = set()
# Clock/timing for pts-based frames (similar to base_output.py)
@ -167,6 +173,9 @@ class RealtimeFeedbackObserver(BaseObserver):
},
}
)
# Increment turn counter on final user transcription
if self._logs_buffer:
self._logs_buffer.increment_turn()
# Handle bot TTS text - respect pts timing
elif isinstance(frame, TTSTextFrame):
message = {
@ -219,9 +228,17 @@ class RealtimeFeedbackObserver(BaseObserver):
)
async def _send_message(self, message: dict):
"""Send message via WebSocket, handling errors gracefully."""
"""Send message via WebSocket AND append to logs buffer, handling errors gracefully."""
# Send via WebSocket
try:
await self._ws_sender(message)
except Exception as e:
# Log but don't fail - feedback is non-critical
logger.debug(f"Failed to send real-time feedback message: {e}")
# Also append to logs buffer
if self._logs_buffer:
try:
await self._logs_buffer.append(message)
except Exception as e:
logger.error(f"Failed to append to logs buffer: {e}")

View file

@ -566,12 +566,6 @@ async def _run_pipeline(
# Create pipeline task with audio configuration
task = create_pipeline_task(pipeline, workflow_run_id, audio_config)
# Add real-time feedback observer if WebSocket sender is available
ws_sender = get_ws_sender(workflow_run_id)
if ws_sender:
feedback_observer = RealtimeFeedbackObserver(ws_sender=ws_sender)
task.add_observer(feedback_observer)
# Now set the task on the engine
engine.set_task(task)
@ -579,7 +573,7 @@ async def _run_pipeline(
await engine.initialize()
# Register event handlers
in_memory_audio_buffer, in_memory_transcript_buffer = (
in_memory_audio_buffer, in_memory_transcript_buffer, in_memory_logs_buffer = (
register_transport_event_handlers(
task,
transport,
@ -590,6 +584,14 @@ async def _run_pipeline(
)
)
# Add real-time feedback observer if WebSocket sender is available
ws_sender = get_ws_sender(workflow_run_id)
if ws_sender:
feedback_observer = RealtimeFeedbackObserver(
ws_sender=ws_sender, logs_buffer=in_memory_logs_buffer
)
task.add_observer(feedback_observer)
register_task_event_handler(
workflow_run_id,
engine,
@ -598,6 +600,7 @@ async def _run_pipeline(
audio_buffer,
in_memory_audio_buffer,
in_memory_transcript_buffer,
in_memory_logs_buffer,
pipeline_metrics_aggregator,
)

View file

@ -0,0 +1,166 @@
'use client';
import { CheckCircle, MessageSquare, MicOff,Wrench } from 'lucide-react';
import { cn } from '@/lib/utils';
interface RealtimeFeedbackEvent {
type: string;
payload: {
text?: string;
final?: boolean;
user_id?: string;
timestamp?: string;
function_name?: string;
tool_call_id?: string;
result?: string;
};
timestamp: string;
turn: number;
}
export interface WorkflowRunLogs {
realtime_feedback_events?: RealtimeFeedbackEvent[];
}
interface RealtimeFeedbackLogsProps {
logs: WorkflowRunLogs | null;
}
const EventItem = ({ event }: { event: RealtimeFeedbackEvent }) => {
// Function call message - centered
if (event.type === 'rtf-function-call-start' || event.type === 'rtf-function-call-end') {
return (
<div className="flex justify-center">
<div className="px-3 py-1.5 rounded-full text-xs bg-amber-500/10 border border-amber-500/20 inline-flex items-center gap-2">
{event.type === 'rtf-function-call-start' ? (
<Wrench className="h-3 w-3 text-amber-500" />
) : (
<CheckCircle className="h-3 w-3 text-green-500" />
)}
<span className="font-mono text-amber-700 dark:text-amber-400">
{event.payload.function_name}()
</span>
{event.type === 'rtf-function-call-end' && (
<span className="text-muted-foreground"></span>
)}
</div>
</div>
);
}
const isUser = event.type === 'rtf-user-transcription';
// User messages on right, bot messages on left
return (
<div className={cn(
"flex",
isUser ? "justify-end" : "justify-start"
)}>
<div
className={cn(
"max-w-[85%] px-3 py-2 rounded-2xl text-sm",
isUser
? "bg-primary text-primary-foreground rounded-br-md"
: "bg-muted rounded-bl-md"
)}
>
<div className="whitespace-pre-wrap leading-relaxed">{event.payload.text}</div>
</div>
</div>
);
};
function processEvents(events: RealtimeFeedbackEvent[]): RealtimeFeedbackEvent[] {
// Filter out interim transcriptions
const filteredEvents = events.filter(event => {
if (event.type === 'rtf-user-transcription' && !event.payload.final) {
return false;
}
return true;
});
// Combine consecutive rtf-bot-text events by turn
const processed: RealtimeFeedbackEvent[] = [];
let currentBotText: RealtimeFeedbackEvent | null = null;
for (const event of filteredEvents) {
if (event.type === 'rtf-bot-text') {
if (currentBotText && currentBotText.turn === event.turn) {
// Same turn, combine the text
currentBotText.payload.text = (currentBotText.payload.text || '') + ' ' + (event.payload.text || '');
} else {
// Different turn or first bot text
if (currentBotText) {
processed.push(currentBotText);
}
// Deep copy to avoid mutating original event
currentBotText = {
...event,
payload: { ...event.payload }
};
}
} else {
// Not a bot text event
if (currentBotText) {
processed.push(currentBotText);
currentBotText = null;
}
processed.push(event);
}
}
// Don't forget the last bot text if there is one
if (currentBotText) {
processed.push(currentBotText);
}
return processed;
}
export function RealtimeFeedbackLogs({ logs }: RealtimeFeedbackLogsProps) {
const rawEvents = logs?.realtime_feedback_events;
const events = rawEvents ? processEvents(rawEvents) : undefined;
return (
<div className="w-full h-full flex flex-col bg-background border-l border-border">
{/* Header */}
<div className="px-4 py-3 border-b border-border shrink-0">
<div className="flex items-center justify-center gap-2">
<MessageSquare className="h-4 w-4 text-muted-foreground shrink-0" />
<span className="font-medium text-sm whitespace-nowrap">Call Transcript</span>
<div className="flex items-center gap-1 text-xs px-2 py-0.5 rounded-full shrink-0 bg-muted text-muted-foreground">
<MicOff className="h-3 w-3" />
<span>Ended</span>
</div>
</div>
</div>
{/* Messages */}
<div className="flex-1 overflow-y-auto">
{!events || events.length === 0 ? (
<div className="flex flex-col items-center justify-center h-full text-muted-foreground text-sm">
<MessageSquare className="h-10 w-10 mb-4 opacity-30" />
<p className="font-medium">No conversation recorded</p>
<p className="text-xs mt-1 text-center px-4">
Real-time feedback events were not captured for this call
</p>
</div>
) : (
<div className="space-y-3 p-4">
{events.map((event, index) => (
<EventItem key={index} event={event} />
))}
</div>
)}
</div>
{/* Footer with message count */}
{events && events.length > 0 && (
<div className="px-4 py-2 border-t border-border text-xs text-muted-foreground shrink-0">
{events.filter(e => e.type === 'rtf-user-transcription' || e.type === 'rtf-bot-text').length} messages
</div>
)}
</div>
);
}

View file

@ -2,5 +2,6 @@ export * from './ApiKeyErrorDialog';
export * from './AudioControls';
export * from './ConnectionStatus';
export * from './ContextDisplay';
export * from './RealtimeFeedbackLogs';
export * from './RealtimeFeedbackPanel';
export * from './WorkflowConfigErrorDialog'
export * from './WorkflowConfigErrorDialog';

View file

@ -6,6 +6,7 @@ import { useParams } from 'next/navigation';
import { useEffect, useRef, useState } from 'react';
import BrowserCall from '@/app/workflow/[workflowId]/run/[runId]/BrowserCall';
import { RealtimeFeedbackLogs, WorkflowRunLogs } from '@/app/workflow/[workflowId]/run/[runId]/components/RealtimeFeedbackLogs';
import WorkflowLayout from '@/app/workflow/WorkflowLayout';
import { getWorkflowRunApiV1WorkflowWorkflowIdRunsRunIdGet } from '@/client/sdk.gen';
import { MediaPreviewButtons, MediaPreviewDialog } from '@/components/MediaPreviewDialog';
@ -23,6 +24,7 @@ interface WorkflowRunResponse {
recording_url: string | null;
initial_context: Record<string, string | number | boolean | object> | null;
gathered_context: Record<string, string | number | boolean | object> | null;
logs: WorkflowRunLogs | null;
}
function ContextDisplay({ title, context }: { title: string; context: Record<string, string | number | boolean | object> | null }) {
@ -116,6 +118,7 @@ export default function WorkflowRunPage() {
recording_url: response.data?.recording_url ?? null,
initial_context: response.data?.initial_context as Record<string, string> | null ?? null,
gathered_context: response.data?.gathered_context as Record<string, string> | null ?? null,
logs: response.data?.logs as WorkflowRunLogs | null ?? null,
});
};
fetchWorkflowRun();
@ -147,8 +150,10 @@ export default function WorkflowRunPage() {
}
else if (workflowRun?.is_completed) {
returnValue = (
<div className="h-full flex items-center justify-center p-6">
<div className="w-full max-w-4xl space-y-6">
<div className="flex h-full w-full">
{/* Main content - 2/3 width */}
<div className="w-2/3 h-full flex items-center justify-center overflow-y-auto">
<div className="w-full max-w-4xl space-y-6 p-6">
<Card className="border-border">
<CardHeader className="flex flex-row items-center justify-between">
<div className="flex items-center gap-4">
@ -235,17 +240,23 @@ export default function WorkflowRunPage() {
</CardContent>
</Card>
<div className="grid gap-6 md:grid-cols-2">
<ContextDisplay
title="Initial Context"
context={workflowRun?.initial_context}
/>
<ContextDisplay
title="Gathered Context"
context={workflowRun?.gathered_context}
/>
<div className="grid gap-6 md:grid-cols-2">
<ContextDisplay
title="Initial Context"
context={workflowRun?.initial_context}
/>
<ContextDisplay
title="Gathered Context"
context={workflowRun?.gathered_context}
/>
</div>
</div>
</div>
{/* Transcript panel - 1/3 width */}
<div className="w-1/3 h-full shrink-0">
<RealtimeFeedbackLogs logs={workflowRun?.logs} />
</div>
</div>
);
}

View file

@ -964,6 +964,9 @@ export type WorkflowRunResponseSchema = {
[key: string]: unknown;
} | null;
call_type: CallType;
logs?: {
[key: string]: unknown;
} | null;
};
export type WorkflowRunUsageResponse = {