2024-12-31 01:52:16 -07:00
|
|
|
"""Audio conversion service"""
|
2024-12-31 01:57:00 -07:00
|
|
|
|
2024-12-31 01:52:16 -07:00
|
|
|
from io import BytesIO
|
2024-12-31 02:55:51 -07:00
|
|
|
|
2024-12-31 01:52:16 -07:00
|
|
|
import numpy as np
|
|
|
|
import soundfile as sf
|
2024-12-31 02:55:51 -07:00
|
|
|
from loguru import logger
|
2024-12-31 01:52:16 -07:00
|
|
|
|
2024-12-31 01:57:00 -07:00
|
|
|
|
2024-12-31 01:52:16 -07:00
|
|
|
class AudioService:
    """Service for audio format conversions"""

    @staticmethod
    def _normalize_to_int16(audio_data: np.ndarray) -> np.ndarray:
        """Peak-normalize samples and convert them to int16.

        The samples are scaled so that the largest absolute value maps to
        the int16 maximum, then truncated to int16.

        Args:
            audio_data: Array of audio samples

        Returns:
            int16 array with the same shape as the input. Empty input
            yields an empty array and all-zero input yields all zeros.
        """
        samples = np.asarray(audio_data)

        # An empty array has no peak; `.max()` would raise on it.
        if samples.size == 0:
            return samples.astype(np.int16)

        # A plain Python float keeps float32 input in float32 during the
        # division instead of promoting the whole array to float64.
        peak = float(np.abs(samples).max())

        # Silence: dividing by a zero peak would produce NaN, and casting
        # NaN to an integer type is undefined.
        if peak == 0.0:
            return np.zeros(samples.shape, dtype=np.int16)

        return (samples / peak * np.iinfo(np.int16).max).astype(np.int16)

    @staticmethod
    def convert_audio(
        audio_data: np.ndarray, sample_rate: int, output_format: str
    ) -> bytes:
        """Convert audio data to specified format

        For "wav" and "pcm" the samples are peak-normalized and converted
        to int16 first. For "mp3", "opus" and "flac" the samples are handed
        to soundfile unchanged.

        Args:
            audio_data: Numpy array of audio samples
            sample_rate: Sample rate of the audio
            output_format: Target format (wav, mp3, opus, flac, pcm)

        Returns:
            Bytes of the converted audio. For "pcm" these are the raw int16
            samples without any container or header.

        Raises:
            ValueError: If the format is not supported or the conversion
                fails. The underlying exception is attached as the cause.
        """
        buffer = BytesIO()

        try:
            if output_format == "wav":
                logger.info("Writing to WAV format...")
                audio_data_wav = AudioService._normalize_to_int16(audio_data)
                sf.write(buffer, audio_data_wav, sample_rate, format="WAV")
            elif output_format == "mp3":
                logger.info("Converting to MP3 format...")
                # NOTE(review): MP3 encoding is delegated to soundfile's
                # backend; whether it is available presumably depends on the
                # installed libsndfile build - confirm for the deployment.
                sf.write(buffer, audio_data, sample_rate, format="MP3")
            elif output_format == "opus":
                logger.info("Converting to Opus format...")
                sf.write(buffer, audio_data, sample_rate, format="OGG", subtype="OPUS")
            elif output_format == "flac":
                logger.info("Converting to FLAC format...")
                sf.write(buffer, audio_data, sample_rate, format="FLAC")
            elif output_format == "pcm":
                logger.info("Extracting PCM data...")
                audio_data_pcm = AudioService._normalize_to_int16(audio_data)
                buffer.write(audio_data_pcm.tobytes())
            else:
                # Raised inside the try on purpose: the handler below logs it
                # and wraps it exactly like any other conversion failure.
                raise ValueError(
                    f"Format {output_format} not supported. Supported formats are: wav, mp3, opus, flac, pcm."
                )

            # getvalue() returns the whole buffer regardless of position.
            return buffer.getvalue()

        except Exception as e:
            logger.error(f"Error converting audio to {output_format}: {e}")
            raise ValueError(f"Failed to convert audio to {output_format}: {e}") from e
|