feat: add audio transcription functionality to ETL pipeline

2026-05-09 15:52:40 +02:00 · 2026-04-05 17:26:03 +05:30 · 2026-04-05 17:26:03 +05:30 · 02fc6f1d16
commit 02fc6f1d16
parent 5d22349dc1
2 changed files with 34 additions and 0 deletions
--- a/surfsense_backend/app/etl_pipeline/parsers/init.py
+++ b/surfsense_backend/app/etl_pipeline/parsers/init.py
--- a/surfsense_backend/app/etl_pipeline/parsers/audio.py
+++ b/surfsense_backend/app/etl_pipeline/parsers/audio.py
@ -0,0 +1,34 @@
 from litellm import atranscription
 from app.config import config as app_config
 async def transcribe_audio(file_path: str, filename: str) -> str:
    stt_service_type = (
        "local"
        if app_config.STT_SERVICE and app_config.STT_SERVICE.startswith("local/")
        else "external"
    )
    if stt_service_type == "local":
        from app.services.stt_service import stt_service
        result = stt_service.transcribe_file(file_path)
        text = result.get("text", "")
        if not text:
            raise ValueError("Transcription returned empty text")
    else:
        with open(file_path, "rb") as audio_file:
            kwargs: dict = {
                "model": app_config.STT_SERVICE,
                "file": audio_file,
                "api_key": app_config.STT_SERVICE_API_KEY,
            }
            if app_config.STT_SERVICE_API_BASE:
                kwargs["api_base"] = app_config.STT_SERVICE_API_BASE
            response = await atranscription(**kwargs)
            text = response.get("text", "")
            if not text:
                raise ValueError("Transcription returned empty text")
    return f"# Transcription of {filename}\n\n{text}"