fix: changes to update pipecat version to 0.0.100 (#122)

* feat: add stt evals
* add smart turn as provider
* chore: remove deprecations
* chore: format files
* fix: remove deprecated UserIdleProcessor
* fix: remove deprecated TranscriptProcessor
* chore: update pipecat submodule
* feat: add evals visualisation
* fix: trigger llm generation on client connected and pipeline started
* chore: update pipecat
* chore: update pipecat submodule
* Add tests
* fix: slow loading of workflow page
* chore: update pipecat submodule
* Show version after release
* Fixes #99
* fix: provider check for websocket connection
* Fixes #107
* Fix #96
* chore: fix documentation
* fix: cloudonix campaign call error

---------

Co-authored-by: Sabiha Khan <sabihak89@gmail.com>
2026-06-28 08:49:42 +02:00 · 2026-01-23 18:53:59 +05:30 · 2026-01-23 18:53:59 +05:30 · 911c5ed416
commit 911c5ed416
parent a4367bd83b
104 changed files with 16919 additions and 597 deletions
--- a/api/tasks/arq.py
+++ b/api/tasks/arq.py
@ -49,8 +49,7 @@ from api.tasks.campaign_tasks import (
 from api.tasks.knowledge_base_processing import process_knowledge_base_document
 from api.tasks.run_integrations import run_integrations_post_workflow_run
 from api.tasks.s3_upload import (
-    upload_audio_to_s3,
-    upload_transcript_to_s3,
+    process_workflow_completion,
    upload_voicemail_audio_to_s3,
 )

@ -59,9 +58,8 @@ class WorkerSettings:
    functions = [
        calculate_workflow_run_cost,
        run_integrations_post_workflow_run,
-        upload_audio_to_s3,
-        upload_transcript_to_s3,
        upload_voicemail_audio_to_s3,
+        process_workflow_completion,
        sync_campaign_source,
        process_campaign_batch,
        monitor_campaign_progress,
--- a/api/tasks/function_names.py
+++ b/api/tasks/function_names.py
@ -1,8 +1,7 @@
 class FunctionNames:
    CALCULATE_WORKFLOW_RUN_COST = "calculate_workflow_run_cost"
    RUN_INTEGRATIONS_POST_WORKFLOW_RUN = "run_integrations_post_workflow_run"
-    UPLOAD_AUDIO_TO_S3 = "upload_audio_to_s3"
-    UPLOAD_TRANSCRIPT_TO_S3 = "upload_transcript_to_s3"
+    PROCESS_WORKFLOW_COMPLETION = "process_workflow_completion"
    UPLOAD_VOICEMAIL_AUDIO_TO_S3 = "upload_voicemail_audio_to_s3"
    SYNC_CAMPAIGN_SOURCE = "sync_campaign_source"
    PROCESS_CAMPAIGN_BATCH = "process_campaign_batch"
--- a/api/tasks/run_integrations.py
+++ b/api/tasks/run_integrations.py
@ -1,10 +1,11 @@
 """Execute webhook integrations after workflow run completion."""

-from typing import Any, Dict
+from typing import Any, Dict, Optional

 import httpx
 from loguru import logger

+from api.constants import BACKEND_API_ENDPOINT
 from api.db import db_client
 from api.db.models import WorkflowRunModel
 from api.utils.credential_auth import build_auth_header
@ -54,10 +55,13 @@ async def run_integrations_post_workflow_run(_ctx, workflow_run_id: int):

        logger.info(f"Found {len(webhook_nodes)} webhook nodes to execute")

-        # Step 4: Build render context
-        render_context = _build_render_context(workflow_run)
+        # Step 4: Generate public access token (on-demand, only when webhooks exist)
+        public_token = await db_client.ensure_public_access_token(workflow_run_id)

-        # Step 5: Execute each webhook node
+        # Step 5: Build render context
+        render_context = _build_render_context(workflow_run, public_token)
+
+        # Step 6: Execute each webhook node
        for node in webhook_nodes:
            webhook_data = node.get("data", {})
            try:
@ -77,9 +81,19 @@ async def run_integrations_post_workflow_run(_ctx, workflow_run_id: int):
        raise


-def _build_render_context(workflow_run: WorkflowRunModel) -> Dict[str, Any]:
-    """Build the context dict for template rendering."""
-    return {
+def _build_render_context(
+    workflow_run: WorkflowRunModel, public_token: Optional[str] = None
+) -> Dict[str, Any]:
+    """Build the context dict for template rendering.
+
+    Args:
+        workflow_run: The workflow run model
+        public_token: Optional public access token for download URLs
+
+    Returns:
+        Dict containing all fields available for template rendering
+    """
+    context = {
        # Top-level fields
        "workflow_run_id": workflow_run.id,
        "workflow_run_name": workflow_run.name,
@ -89,10 +103,25 @@ def _build_render_context(workflow_run: WorkflowRunModel) -> Dict[str, Any]:
        "initial_context": workflow_run.initial_context or {},
        "gathered_context": workflow_run.gathered_context or {},
        "cost_info": workflow_run.usage_info or {},
-        "recording_url": getattr(workflow_run, "recording_url", None),
-        "transcript_url": getattr(workflow_run, "transcript_url", None),
    }

+    # Add public download URLs if token is available
+    if public_token:
+        base_url = (
+            f"{BACKEND_API_ENDPOINT}/api/v1/public/download/workflow/{public_token}"
+        )
+        context["recording_url"] = (
+            f"{base_url}/recording" if workflow_run.recording_url else None
+        )
+        context["transcript_url"] = (
+            f"{base_url}/transcript" if workflow_run.transcript_url else None
+        )
+    else:
+        context["recording_url"] = workflow_run.recording_url
+        context["transcript_url"] = workflow_run.transcript_url
+
+    return context
+

 async def _execute_webhook_node(
    webhook_data: Dict[str, Any],
--- a/api/tasks/s3_upload.py
+++ b/api/tasks/s3_upload.py
@ -1,129 +1,27 @@
 import os
+from typing import Optional

 from loguru import logger
-from pipecat.utils.context import set_current_run_id

 from api.db import db_client
 from api.services.storage import get_current_storage_backend, storage_fs
-
-
-async def upload_audio_to_s3(ctx, workflow_run_id: int, temp_file_path: str):
-    """Upload audio file from temp path to S3."""
-    run_id = str(workflow_run_id)
-    set_current_run_id(run_id)
-
-    logger.info(f"Starting audio upload to S3 from {temp_file_path}")
-
-    try:
-        # Verify temp file exists
-        if not os.path.exists(temp_file_path):
-            logger.error(f"Temp audio file not found: {temp_file_path}")
-            raise FileNotFoundError(f"Temp audio file not found: {temp_file_path}")
-
-        file_size = os.path.getsize(temp_file_path)
-        logger.debug(f"Audio file size: {file_size} bytes")
-
-        recording_url = f"recordings/{workflow_run_id}.wav"
-        storage_backend = get_current_storage_backend()
-
-        logger.info(
-            f"UPLOAD: Using {storage_backend.name} (value: {storage_backend.value}) for audio upload - workflow_run_id: {workflow_run_id}"
-        )
-
-        await storage_fs.aupload_file(temp_file_path, recording_url)
-
-        # Update DB with recording URL and storage backend
-        await db_client.update_workflow_run(
-            run_id=workflow_run_id,
-            recording_url=recording_url,
-            storage_backend=storage_backend.value,
-        )
-
-        logger.info(
-            f"Successfully uploaded audio to {storage_backend.name}: {recording_url} (stored backend: {storage_backend.name})"
-        )
-
-    except Exception as e:
-        logger.error(f"Error uploading audio to S3 for workflow {workflow_run_id}: {e}")
-        raise
-    finally:
-        # Clean up temp file
-        if os.path.exists(temp_file_path):
-            try:
-                os.remove(temp_file_path)
-                logger.debug(f"Cleaned up temp audio file: {temp_file_path}")
-            except Exception as e:
-                logger.warning(
-                    f"Failed to clean up temp audio file {temp_file_path}: {e}"
-                )
-
-
-async def upload_transcript_to_s3(ctx, workflow_run_id: int, temp_file_path: str):
-    """Upload transcript file from temp path to S3."""
-    run_id = str(workflow_run_id)
-    set_current_run_id(run_id)
-
-    logger.info(f"Starting transcript upload to S3 from {temp_file_path}")
-
-    try:
-        # Verify temp file exists
-        if not os.path.exists(temp_file_path):
-            logger.error(f"Temp transcript file not found: {temp_file_path}")
-            raise FileNotFoundError(f"Temp transcript file not found: {temp_file_path}")
-
-        file_size = os.path.getsize(temp_file_path)
-        logger.debug(f"Transcript file size: {file_size} bytes")
-
-        transcript_url = f"transcripts/{workflow_run_id}.txt"
-        storage_backend = get_current_storage_backend()
-
-        logger.info(
-            f"UPLOAD: Using {storage_backend.name} (value: {storage_backend.value}) for transcript upload - workflow_run_id: {workflow_run_id}"
-        )
-
-        await storage_fs.aupload_file(temp_file_path, transcript_url)
-
-        # Update DB with transcript URL and storage backend
-        await db_client.update_workflow_run(
-            run_id=workflow_run_id,
-            transcript_url=transcript_url,
-            storage_backend=storage_backend.value,
-        )
-
-        logger.info(
-            f"Successfully uploaded transcript to {storage_backend.name}: {transcript_url} (stored backend: {storage_backend.name})"
-        )
-
-    except Exception as e:
-        logger.error(
-            f"Error uploading transcript to S3 for workflow {workflow_run_id}: {e}"
-        )
-        raise
-    finally:
-        # Clean up temp file
-        if os.path.exists(temp_file_path):
-            try:
-                os.remove(temp_file_path)
-                logger.debug(f"Cleaned up temp transcript file: {temp_file_path}")
-            except Exception as e:
-                logger.warning(
-                    f"Failed to clean up temp transcript file {temp_file_path}: {e}"
-                )
+from api.tasks.run_integrations import run_integrations_post_workflow_run
+from pipecat.utils.context import set_current_run_id


 async def upload_voicemail_audio_to_s3(
-    ctx,
+    _ctx,
    workflow_run_id: int,
    temp_file_path: str,
    s3_key: str,
 ):
    """Upload voicemail detection audio from temp file to S3.

-    This function is similar to upload_audio_to_s3 but handles voicemail-specific
-    paths and doesn't update the workflow run's recording_url field.
+    Handles voicemail-specific paths and doesn't update the workflow run's
+    recording_url field.

    Args:
-        ctx: ARQ context
+        _ctx: ARQ context (unused)
        workflow_run_id: The workflow run ID
        temp_file_path: Path to the temporary WAV file
        s3_key: The S3 key where the file should be uploaded
@ -161,7 +59,7 @@ async def upload_voicemail_audio_to_s3(
        )
        raise
    finally:
-        # Clean up temp file (same pattern as upload_audio_to_s3)
+        # Clean up temp file
        if os.path.exists(temp_file_path):
            try:
                os.remove(temp_file_path)
@ -170,3 +68,104 @@ async def upload_voicemail_audio_to_s3(
                logger.warning(
                    f"Failed to clean up temp voicemail audio file {temp_file_path}: {e}"
                )
+
+
+async def process_workflow_completion(
+    _ctx,
+    workflow_run_id: int,
+    audio_temp_path: Optional[str] = None,
+    transcript_temp_path: Optional[str] = None,
+):
+    """Upload a finished run's artifacts, then run its webhook integrations.
+
+    Steps run sequentially so integrations start only after the upload attempts.
+    Each step logs and swallows its own errors, so one failure never skips the rest.
+
+    Args:
+        _ctx: ARQ context; not read here, only forwarded to the integrations task
+        workflow_run_id: Run ID; names the stored objects and the DB row to update
+        audio_temp_path: Temp audio file to upload; removal is attempted afterwards
+        transcript_temp_path: Temp transcript file; handled the same way as audio
+    """
+    run_id = str(workflow_run_id)
+    set_current_run_id(run_id)
+
+    logger.info(f"Processing workflow completion for run {workflow_run_id}")
+
+    storage_backend = get_current_storage_backend()
+
+    # Step 1: Upload audio if a path was given (errors are logged, not raised)
+    if audio_temp_path:
+        try:
+            if os.path.exists(audio_temp_path):
+                file_size = os.path.getsize(audio_temp_path)
+                logger.debug(f"Audio file size: {file_size} bytes")
+
+                recording_url = f"recordings/{workflow_run_id}.wav"
+                logger.info(
+                    f"Uploading audio to {storage_backend.name} - workflow_run_id: {workflow_run_id}"
+                )
+
+                await storage_fs.aupload_file(audio_temp_path, recording_url)
+                await db_client.update_workflow_run(
+                    run_id=workflow_run_id,
+                    recording_url=recording_url,
+                    storage_backend=storage_backend.value,
+                )
+                logger.info(f"Successfully uploaded audio: {recording_url}")
+            else:
+                logger.warning(f"Audio temp file not found: {audio_temp_path}")
+        except Exception as e:
+            logger.error(f"Error uploading audio for workflow {workflow_run_id}: {e}")
+        finally:
+            if audio_temp_path and os.path.exists(audio_temp_path):
+                try:
+                    os.remove(audio_temp_path)
+                    logger.debug(f"Cleaned up temp audio file: {audio_temp_path}")
+                except Exception as e:
+                    logger.warning(f"Failed to clean up temp audio file: {e}")
+
+    # Step 2: Upload transcript if a path was given (same handling as the audio step)
+    if transcript_temp_path:
+        try:
+            if os.path.exists(transcript_temp_path):
+                file_size = os.path.getsize(transcript_temp_path)
+                logger.debug(f"Transcript file size: {file_size} bytes")
+
+                transcript_url = f"transcripts/{workflow_run_id}.txt"
+                logger.info(
+                    f"Uploading transcript to {storage_backend.name} - workflow_run_id: {workflow_run_id}"
+                )
+
+                await storage_fs.aupload_file(transcript_temp_path, transcript_url)
+                await db_client.update_workflow_run(
+                    run_id=workflow_run_id,
+                    transcript_url=transcript_url,
+                    storage_backend=storage_backend.value,
+                )
+                logger.info(f"Successfully uploaded transcript: {transcript_url}")
+            else:
+                logger.warning(
+                    f"Transcript temp file not found: {transcript_temp_path}"
+                )
+        except Exception as e:
+            logger.error(
+                f"Error uploading transcript for workflow {workflow_run_id}: {e}"
+            )
+        finally:
+            if transcript_temp_path and os.path.exists(transcript_temp_path):
+                try:
+                    os.remove(transcript_temp_path)
+                    logger.debug(
+                        f"Cleaned up temp transcript file: {transcript_temp_path}"
+                    )
+                except Exception as e:
+                    logger.warning(f"Failed to clean up temp transcript file: {e}")
+
+    # Step 3: Run webhook integrations after the upload attempts (errors are logged, not raised)
+    try:
+        await run_integrations_post_workflow_run(_ctx, workflow_run_id)
+    except Exception as e:
+        logger.error(f"Error running integrations for workflow {workflow_run_id}: {e}")
+
+    logger.info(f"Completed workflow completion processing for run {workflow_run_id}")