"""Audio upload validation and speech-to-text transcription service."""
import io

from werkzeug.datastructures import FileStorage

from core.llm.llm_builder import LLMBuilder
from core.llm.provider.llm_provider_service import LLMProviderService
from services.errors.audio import NoAudioUploadedServiceError, AudioTooLargeServiceError, \
    UnsupportedAudioTypeServiceError, ProviderNotSupportSpeechToTextServiceError
from core.llm.whisper import Whisper
from models.provider import ProviderName

# Maximum accepted upload size, in megabytes (used in the error message).
FILE_SIZE = 15
# The same limit expressed in bytes (used for the actual comparison).
FILE_SIZE_LIMIT = FILE_SIZE * 1024 * 1024
# Subtypes accepted after the "audio/" prefix of the upload's MIME type.
ALLOWED_EXTENSIONS = ['mp3', 'mp4', 'mpeg', 'mpga', 'm4a', 'wav', 'webm']


class AudioService:
    """Validates uploaded audio and forwards it to Whisper for transcription."""

    @classmethod
    def transcript(cls, tenant_id: str, file: FileStorage):
        """Validate an uploaded audio file and transcribe it.

        Checks run in this order: presence, MIME type, size, provider.

        Args:
            tenant_id: Tenant whose default provider for ``'whisper-1'`` is
                looked up and used.
            file: The uploaded file, or ``None`` when nothing was uploaded.

        Returns:
            Whatever ``Whisper.transcribe`` returns for the uploaded bytes.

        Raises:
            NoAudioUploadedServiceError: ``file`` is ``None``.
            UnsupportedAudioTypeServiceError: the MIME type is not
                ``audio/<ext>`` for some ``ext`` in ``ALLOWED_EXTENSIONS``.
            AudioTooLargeServiceError: the upload exceeds ``FILE_SIZE_LIMIT``
                bytes.
            ProviderNotSupportSpeechToTextServiceError: the tenant's default
                provider is not OpenAI.
        """
        if file is None:
            raise NoAudioUploadedServiceError()

        # NOTE(review): the allow-list is derived as "audio/<ext>", so MIME
        # types such as "audio/x-wav" or "video/webm" are rejected -- confirm
        # this matches what clients actually send.
        mimetype = file.mimetype
        allowed_mimetypes = {f'audio/{ext}' for ext in ALLOWED_EXTENSIONS}
        if mimetype not in allowed_mimetypes:
            raise UnsupportedAudioTypeServiceError()

        # Read at most one byte past the limit: enough to detect an oversized
        # upload without buffering an arbitrarily large body in memory.
        file_content = file.read(FILE_SIZE_LIMIT + 1)
        if len(file_content) > FILE_SIZE_LIMIT:
            message = f"Audio size larger than {FILE_SIZE} mb"
            raise AudioTooLargeServiceError(message)

        provider_name = LLMBuilder.get_default_provider(tenant_id, 'whisper-1')
        if provider_name != ProviderName.OPENAI.value:
            raise ProviderNotSupportSpeechToTextServiceError()

        provider_service = LLMProviderService(tenant_id, provider_name)

        buffer = io.BytesIO(file_content)
        # NOTE(review): the name is fixed to 'temp.mp3' regardless of the
        # uploaded format; presumably the transcription client needs a
        # file-like object with a ``name`` -- confirm the extension is harmless.
        buffer.name = 'temp.mp3'

        return Whisper(provider_service.provider).transcribe(buffer)