dograh/api/utils/hold_audio.py

"""
Hold audio utility for loading and caching hold music files.

This module provides functionality to load hold music audio files at specific sample rates
with caching to improve performance during multiple calls.
"""

from typing import Dict, Optional, Tuple

import numpy as np
from loguru import logger

# soundfile is needed to decode hold music files. If it is missing, log an
# actionable hint and abort the module import.
try:
    import soundfile as sf
except ModuleNotFoundError as e:
    logger.error(f"Exception: {e}")
    logger.error("In order to use hold audio, you need to `pip install soundfile`.")
    # Chain explicitly so the traceback reports the missing module as the
    # direct cause of this failure.
    raise Exception(f"Missing module: {e}") from e


# Global cache for loaded hold music data.
# Keys are the (file_path, sample_rate) pairs passed to load_hold_audio; values
# are the decoded int16 sample arrays that function stores after a successful load.
_hold_audio_cache: Dict[Tuple[str, int], np.ndarray] = {}


def load_hold_audio(file_path: str, sample_rate: int) -> Optional[bytes]:
    """Load a hold music file as mono PCM16 bytes, caching the decoded samples.

    Decoded samples are cached per ``(file_path, sample_rate)`` pair, so repeated
    calls with the same arguments do not read the file again.

    No resampling is performed here: when the file's own sample rate differs
    from ``sample_rate`` a warning is logged and the samples are returned at
    the file's rate.

    Args:
        file_path: Path to the hold music audio file
        sample_rate: Target sample rate (8000 or 16000 Hz supported)

    Returns:
        Audio data as bytes (PCM16, first channel only) or None if loading failed
    """
    cache_key = (file_path, sample_rate)

    # Check cache first (stored values are arrays, never None)
    cached = _hold_audio_cache.get(cache_key)
    if cached is not None:
        logger.debug(f"Using cached hold audio for {file_path} at {sample_rate}Hz")
        return cached.tobytes()

    try:
        logger.info(f"Loading hold audio from {file_path} at {sample_rate}Hz")

        # dtype="int16" asks soundfile to decode straight to 16-bit samples
        sound, file_sample_rate = sf.read(file_path, dtype="int16")
        logger.info(
            f"Audio file loaded - file sample_rate: {file_sample_rate}, target: {sample_rate}"
        )

        # Ensure mono audio (take first channel if multi-channel)
        if sound.ndim > 1:
            sound = sound[:, 0]

        if file_sample_rate != sample_rate:
            logger.warning(
                f"Hold music file has sample rate {file_sample_rate}, expected {sample_rate}"
            )
            # The audio is used as-is; resampling is left to the transport.
            # NOTE(review): only raw bytes are returned, so the consumer must
            # learn the file's real rate some other way - confirm with callers.

        # The samples are already int16. ascontiguousarray copies only when
        # `sound` is a strided channel slice, which also lets the full
        # multi-channel buffer be released instead of being kept alive by the
        # cached view.
        audio_data = np.ascontiguousarray(sound, dtype=np.int16)
        _hold_audio_cache[cache_key] = audio_data

        # Report the rate the samples actually have, not the requested one.
        logger.info(
            f"Hold audio loaded successfully: {len(audio_data)} samples at {file_sample_rate}Hz"
        )
        return audio_data.tobytes()

    except Exception as e:
        # Best-effort loader: any failure is logged and reported as None.
        logger.error(f"Failed to load hold audio file {file_path}: {e}")
        return None


def clear_hold_audio_cache() -> None:
    """Clear the hold audio cache to free memory.

    The module-level cache dict is emptied in place rather than rebound, so no
    ``global`` declaration is needed.
    """
    _hold_audio_cache.clear()
    logger.info("Hold audio cache cleared")


def get_cache_info() -> Dict[str, int]:
    """Summarize the current contents of the hold audio cache.

    Returns:
        Dictionary with two entries: ``cached_files`` is the number of cache
        entries, and ``total_cache_size`` is the sum of ``len()`` over the
        cached arrays (a length in array items, not a byte count).
    """
    entry_count = len(_hold_audio_cache)

    combined_length = 0
    for samples in _hold_audio_cache.values():
        combined_length += len(samples)

    return {"cached_files": entry_count, "total_cache_size": combined_length}
feat: telephony call transfer (#155) * transfer call * fix: ignore completed call status * chore: refactor telephony * chore: refactor pipecat engine custom tools and other telephony services * chore: code refactor * chore: put back office ambient sound files * chore: remove transport from engine * fix: fix alembic revision * chore: remove set_transferring_call from engine * fix: send OutputAudio frame and let transport chunk it * fix: reinstate docker compose * chore: remove unused transfer-twmil route for caller * chore: update pipecat submodule --------- Co-authored-by: Abhishek Kumar <abhishek@a6k.me> 2026-02-16 14:33:33 +05:30			`"""`
			`Hold audio utility for loading and caching hold music files.`

			`This module provides functionality to load hold music audio files at specific sample rates`
			`with caching to improve performance during multiple calls.`
			`"""`

			`from typing import Dict, Optional, Tuple`

			`import numpy as np`
			`from loguru import logger`

			`try:`
			`import soundfile as sf`
			`except ModuleNotFoundError as e:`
			`logger.error(f"Exception: {e}")`
			logger.error("In order to use hold audio, you need to `pip install soundfile`.")
			`raise Exception(f"Missing module: {e}")`


			`# Global cache for loaded hold music data`
			`_hold_audio_cache: Dict[Tuple[str, int], np.ndarray] = {}`


			`def load_hold_audio(file_path: str, sample_rate: int) -> Optional[bytes]:`
			`"""Load hold music audio file at the specified sample rate with caching.`

			`Args:`
			`file_path: Path to the hold music audio file`
			`sample_rate: Target sample rate (8000 or 16000 Hz supported)`

			`Returns:`
			`Audio data as bytes (PCM16) or None if loading failed`
			`"""`
			`cache_key = (file_path, sample_rate)`

			`# Check cache first`
			`if cache_key in _hold_audio_cache:`
			`logger.debug(f"Using cached hold audio for {file_path} at {sample_rate}Hz")`
			`audio_data = _hold_audio_cache[cache_key]`
			`return audio_data.tobytes()`

			`try:`
			`logger.info(f"Loading hold audio from {file_path} at {sample_rate}Hz")`

			`# Load audio file`
			`sound, file_sample_rate = sf.read(file_path, dtype="int16")`
			`logger.info(`
			`f"Audio file loaded - file sample_rate: {file_sample_rate}, target: {sample_rate}"`
			`)`

			`# Ensure mono audio (take first channel if stereo)`
			`if len(sound.shape) > 1:`
			`sound = sound[:, 0]`

			`# Resample if needed`
			`if file_sample_rate != sample_rate:`
			`logger.warning(`
			`f"Hold music file has sample rate {file_sample_rate}, expected {sample_rate}"`
			`)`
			`# For now, we'll use the audio as-is and let the transport handle resampling`
			`# In a production system, you might want to use librosa or scipy for proper resampling`

			`# Convert to int16 and cache`
			`audio_data = sound.astype(np.int16)`
			`_hold_audio_cache[cache_key] = audio_data`

			`logger.info(`
			`f"Hold audio loaded successfully: {len(audio_data)} samples at {sample_rate}Hz"`
			`)`
			`return audio_data.tobytes()`

			`except Exception as e:`
			`logger.error(f"Failed to load hold audio file {file_path}: {e}")`
			`return None`


			`def clear_hold_audio_cache():`
			`"""Clear the hold audio cache to free memory."""`
			`global _hold_audio_cache`
			`_hold_audio_cache.clear()`
			`logger.info("Hold audio cache cleared")`


			`def get_cache_info() -> Dict[str, int]:`
			`"""Get information about the current cache state.`

			`Returns:`
			`Dictionary with cache statistics`
			`"""`
			`return {`
			`"cached_files": len(_hold_audio_cache),`
			`"total_cache_size": sum(len(data) for data in _hold_audio_cache.values()),`
			`}`