1
0
mirror of https://github.com/ijaric/voice_assistant.git synced 2025-05-24 14:33:26 +00:00
voice_assistant/src/assistant/lib/stt/repositories.py
2023-10-09 21:09:52 +03:00

48 lines
1.8 KiB
Python

import mimetypes
import tempfile
import magic
import openai
import lib.app.settings as app_settings
import lib.stt as stt
class OpenaiSpeechRepository:
def __init__(self, settings: app_settings.Settings):
self.settings = settings
openai.api_key = self.settings.openai.api_key.get_secret_value()
@staticmethod
def __get_file_extension_from_bytes(audio: bytes) -> str | None:
mime: magic.Magic = magic.Magic(mime=True)
mime_type: str = mime.from_buffer(audio)
extension: str | None = mimetypes.guess_extension(mime_type)
if extension:
extension = extension.replace(".", "")
return extension
async def speech_to_text(self, audio: bytes) -> str:
file_extension = self.__get_file_extension_from_bytes(audio)
if not file_extension:
raise ValueError("File extension is not supported")
voice: stt.models.SttVoice = stt.models.SttVoice(
audio_size=len(audio) // 1024, # audio size in MB,
audio_format=file_extension,
audio_data=audio,
voice_settings=self.settings.voice,
)
try:
with tempfile.NamedTemporaryFile(suffix=f".{file_extension}") as temp_file:
temp_file.write(voice.audio_data)
temp_file.seek(0)
transcript = openai.Audio.transcribe(self.settings.openai.stt_model, temp_file) # type: ignore
except openai.error.InvalidRequestError as e: # type: ignore[reportGeneralTypeIssues]
raise ValueError(f"OpenAI API error: {e}")
except openai.error.OpenAIError as e: # type: ignore[reportGeneralTypeIssues]
raise ValueError(f"OpenAI API error: {e}")
return transcript.text # type: ignore[reportUnknownVariableType]