mirror of
https://github.com/MODSetter/SurfSense.git
synced 2026-06-12 20:45:20 +02:00
70 lines
2.6 KiB
Python
70 lines
2.6 KiB
Python
"""Audio-rendering task: RENDERING -> READY.
|
|
|
|
Synthesises and merges the approved transcript, stores the MP3 in the object
|
|
store, and marks the podcast ready. The working directory is stable per podcast
|
|
so a re-render (e.g. after a voice change) reuses the segment cache.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
import logging
|
|
import tempfile
|
|
from pathlib import Path
|
|
|
|
from app.celery_app import celery_app
|
|
from app.podcasts.persistence import PodcastRepository
|
|
from app.podcasts.rendering import PodcastRenderer
|
|
from app.podcasts.service import PodcastService, read_spec, read_transcript
|
|
from app.podcasts.storage import store_audio
|
|
from app.podcasts.tts import get_text_to_speech
|
|
from app.podcasts.voices import get_voice_catalog
|
|
from app.tasks.celery_tasks import get_celery_session_maker, run_async_celery_task
|
|
|
|
from .runtime import mark_failed
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
_WORKDIR_BASE = Path(tempfile.gettempdir()) / "surfsense_podcasts"
|
|
|
|
|
|
@celery_app.task(name="podcast.render_audio", bind=True)
|
|
def render_audio_task(self, podcast_id: int) -> dict:
|
|
try:
|
|
return run_async_celery_task(lambda: _render_audio(podcast_id))
|
|
except Exception as exc: # noqa: BLE001 - record and report, never crash worker
|
|
logger.error("Podcast %s render failed: %s", podcast_id, exc)
|
|
run_async_celery_task(lambda: mark_failed(podcast_id, str(exc)))
|
|
return {"status": "failed", "podcast_id": podcast_id}
|
|
|
|
|
|
async def _render_audio(podcast_id: int) -> dict:
|
|
async with get_celery_session_maker()() as session:
|
|
repo = PodcastRepository(session)
|
|
podcast = await repo.get(podcast_id)
|
|
if podcast is None:
|
|
raise ValueError(f"podcast {podcast_id} not found")
|
|
|
|
spec = read_spec(podcast)
|
|
transcript = read_transcript(podcast)
|
|
if spec is None or transcript is None:
|
|
raise ValueError(f"podcast {podcast_id} is missing brief or transcript")
|
|
|
|
renderer = PodcastRenderer(
|
|
tts=get_text_to_speech(), catalog=get_voice_catalog()
|
|
)
|
|
workdir = _WORKDIR_BASE / str(podcast_id)
|
|
workdir.mkdir(parents=True, exist_ok=True)
|
|
rendered = await renderer.render(
|
|
spec=spec, transcript=transcript, workdir=workdir
|
|
)
|
|
|
|
backend_name, key = await store_audio(
|
|
search_space_id=podcast.search_space_id,
|
|
podcast_id=podcast_id,
|
|
data=rendered.data,
|
|
)
|
|
await PodcastService(session).attach_audio(
|
|
podcast, storage_backend=backend_name, storage_key=key
|
|
)
|
|
await session.commit()
|
|
return {"status": "ready", "podcast_id": podcast_id}
|