SurfSense/surfsense_backend/app/agents/podcaster/nodes.py

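"""Nodes for the podcaster LangGraph agent: transcript generation and merged audio synthesis."""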

import asyncio
import json
import os
import uuid
from pathlib import Path
from typing import Any

from ffmpeg.asyncio import FFmpeg
from langchain_core.messages import HumanMessage, SystemMessage
from langchain_core.runnables import RunnableConfig
from litellm import aspeech

from app.config import config as app_config
from app.services.kokoro_tts_service import get_kokoro_tts_service
from app.services.llm_service import get_agent_llm

from .configuration import Configuration
from .prompts import get_podcast_generation_prompt
from .state import PodcastTranscriptEntry, PodcastTranscripts, State
from .utils import get_voice_for_provider


async def create_podcast_transcript(
    state: State, config: RunnableConfig
) -> dict[str, Any]:
    """Generate the podcast transcript from the source content using the search space's LLM."""
    # Get configuration from runnable config
    configuration = Configuration.from_runnable_config(config)
    search_space_id = configuration.search_space_id
    user_prompt = configuration.user_prompt

    # Get search space's document summary LLM
    llm = await get_agent_llm(state.db_session, search_space_id)

    if not llm:
        error_message = (
            f"No document summary LLM configured for search space {search_space_id}"
        )
        print(error_message)
        raise RuntimeError(error_message)

    # Get the prompt
    prompt = get_podcast_generation_prompt(user_prompt)

    # Create the messages
    messages = [
        SystemMessage(content=prompt),
        HumanMessage(
            content=f"<source_content>{state.source_content}</source_content>"
        ),
    ]

    # Generate the podcast transcript
    llm_response = await llm.ainvoke(messages)

    # First try the direct approach
    try:
        podcast_transcript = PodcastTranscripts.model_validate(
            json.loads(llm_response.content)
        )
    except (json.JSONDecodeError, ValueError) as e:
        print(f"Direct JSON parsing failed, trying fallback approach: {e!s}")
        # Fallback: Parse the JSON response manually
        try:
            # Extract JSON content from the response
            content = llm_response.content
            # Find the JSON in the content (handle case where LLM might add additional text)
            json_start = content.find("{")
            json_end = content.rfind("}") + 1
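            # e.g. 'Sure! {"podcast_transcripts": [...]} Hope this helps.'
            # is trimmed down to '{"podcast_transcripts": [...]}'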
            if json_start >= 0 and json_end > json_start:
                json_str = content[json_start:json_end]
                # Parse the JSON string
                parsed_data = json.loads(json_str)
                # Convert to Pydantic model
                podcast_transcript = PodcastTranscripts.model_validate(parsed_data)
                print("Successfully parsed podcast transcript using fallback approach")
            else:
                # If JSON structure not found, raise a clear error
                error_message = (
                    f"Could not find valid JSON in LLM response. Raw response: {content}"
                )
                print(error_message)
                raise ValueError(error_message)
        except (json.JSONDecodeError, ValueError) as e2:
            # Log the error and re-raise it
            error_message = f"Error parsing LLM response (fallback also failed): {e2!s}"
            print(error_message)
            print(f"Raw response: {llm_response.content}")
            raise

    return {"podcast_transcript": podcast_transcript.podcast_transcripts}


async def create_merged_podcast_audio(
    state: State, config: RunnableConfig
) -> dict[str, Any]:
    """Generate audio for each transcript entry and merge them into a single podcast file."""
    # configuration = Configuration.from_runnable_config(config)

    starting_transcript = PodcastTranscriptEntry(
        speaker_id=1, dialog="Welcome to Surfsense Podcast."
    )

    transcript = state.podcast_transcript

    # Merge the starting transcript with the podcast transcript
    # Check if transcript is a PodcastTranscripts object or already a list
    if hasattr(transcript, "podcast_transcripts"):
        transcript_entries = transcript.podcast_transcripts
    else:
        transcript_entries = transcript

    merged_transcript = [starting_transcript, *transcript_entries]
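    # merged_transcript now starts with the fixed intro line, followed by the
    # LLM-generated entries (each carrying a speaker_id and its dialog text).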

    # Create a temporary directory for audio files
    temp_dir = Path("temp_audio")
    temp_dir.mkdir(exist_ok=True)

    # Generate a unique session ID for this podcast
    session_id = str(uuid.uuid4())
    output_path = f"podcasts/{session_id}_podcast.mp3"
    os.makedirs("podcasts", exist_ok=True)

    # Generate audio for each transcript segment
    audio_files = []

    async def generate_speech_for_segment(segment, index):
        # Handle both dictionary and PodcastTranscriptEntry objects
        if hasattr(segment, "speaker_id"):
            speaker_id = segment.speaker_id
            dialog = segment.dialog
        else:
            speaker_id = segment.get("speaker_id", 0)
            dialog = segment.get("dialog", "")

        # Select voice based on speaker_id
        voice = get_voice_for_provider(app_config.TTS_SERVICE, speaker_id)
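        # (get_voice_for_provider is assumed to map each speaker_id to a
        # provider-specific voice name, e.g. distinct host and guest voices.)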
        # Generate a unique filename for this segment
        if app_config.TTS_SERVICE == "local/kokoro":
            # Kokoro generates WAV files
            filename = f"{temp_dir}/{session_id}_{index}.wav"
        else:
            # Other services generate MP3 files
            filename = f"{temp_dir}/{session_id}_{index}.mp3"
        try:
            if app_config.TTS_SERVICE == "local/kokoro":
                # Use Kokoro TTS service
                kokoro_service = await get_kokoro_tts_service(
                    lang_code="a"
                )  # American English
                audio_path = await kokoro_service.generate_speech(
                    text=dialog, voice=voice, speed=1.0, output_path=filename
                )
                return audio_path
            else:
                if app_config.TTS_SERVICE_API_BASE:
                    response = await aspeech(
                        model=app_config.TTS_SERVICE,
                        api_base=app_config.TTS_SERVICE_API_BASE,
                        api_key=app_config.TTS_SERVICE_API_KEY,
                        voice=voice,
                        input=dialog,
                        max_retries=2,
                        timeout=600,
                    )
                else:
                    response = await aspeech(
                        model=app_config.TTS_SERVICE,
                        api_key=app_config.TTS_SERVICE_API_KEY,
                        voice=voice,
                        input=dialog,
                        max_retries=2,
                        timeout=600,
                    )
                # Write the returned audio bytes to the segment file
                with open(filename, "wb") as f:
                    f.write(response.content)

                return filename
        except Exception as e:
            print(f"Error generating speech for segment {index}: {e!s}")
            raise

    # Generate all audio files concurrently
    tasks = [
        generate_speech_for_segment(segment, i)
        for i, segment in enumerate(merged_transcript)
    ]
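    # asyncio.gather preserves input order, so audio_files lines up with
    # merged_transcript and the segments are concatenated in dialog order.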
    audio_files = await asyncio.gather(*tasks)

    # Merge audio files using ffmpeg
    try:
        # Create the FFmpeg instance with overwrite ("-y") enabled
        ffmpeg = FFmpeg().option("y")

        # Add each audio file as input
        for audio_file in audio_files:
            ffmpeg = ffmpeg.input(audio_file)

        # Configure the concatenation and output
        filter_complex = []
        for i in range(len(audio_files)):
            filter_complex.append(f"[{i}:0]")

        filter_complex_str = (
            "".join(filter_complex) + f"concat=n={len(audio_files)}:v=0:a=1[outa]"
        )
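        # e.g. with three inputs: "[0:0][1:0][2:0]concat=n=3:v=0:a=1[outa]"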
        ffmpeg = ffmpeg.option("filter_complex", filter_complex_str)
        ffmpeg = ffmpeg.output(output_path, map="[outa]")

        # Execute FFmpeg
        await ffmpeg.execute()

        print(f"Successfully created podcast audio: {output_path}")
    except Exception as e:
        print(f"Error merging audio files: {e!s}")
        raise
    finally:
        # Clean up temporary files
        for audio_file in audio_files:
            try:
                os.remove(audio_file)
            except Exception as e:
                print(f"Error removing audio file {audio_file}: {e!s}")

    return {
        "podcast_transcript": merged_transcript,
        "final_podcast_file_path": output_path,
    }
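

# A minimal sketch of how these nodes are presumably wired together elsewhere
# in the package (the actual graph construction lives outside this module):
#
#     from langgraph.graph import END, START, StateGraph
#
#     workflow = StateGraph(State)
#     workflow.add_node("create_podcast_transcript", create_podcast_transcript)
#     workflow.add_node("create_merged_podcast_audio", create_merged_podcast_audio)
#     workflow.add_edge(START, "create_podcast_transcript")
#     workflow.add_edge("create_podcast_transcript", "create_merged_podcast_audio")
#     workflow.add_edge("create_merged_podcast_audio", END)
#     graph = workflow.compile()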