audio.py 4.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122
  1. import logging
  2. from flask import request
  3. from flask_restful import Resource, reqparse
  4. from werkzeug.exceptions import InternalServerError
  5. import services
  6. from controllers.service_api import api
  7. from controllers.service_api.app.error import (
  8. AppUnavailableError,
  9. AudioTooLargeError,
  10. CompletionRequestError,
  11. NoAudioUploadedError,
  12. ProviderModelCurrentlyNotSupportError,
  13. ProviderNotInitializeError,
  14. ProviderNotSupportSpeechToTextError,
  15. ProviderQuotaExceededError,
  16. UnsupportedAudioTypeError,
  17. )
  18. from controllers.service_api.wraps import FetchUserArg, WhereisUserArg, validate_app_token
  19. from core.errors.error import ModelCurrentlyNotSupportError, ProviderTokenNotInitError, QuotaExceededError
  20. from core.model_runtime.errors.invoke import InvokeError
  21. from models.model import App, AppModelConfig, EndUser
  22. from services.audio_service import AudioService
  23. from services.errors.audio import (
  24. AudioTooLargeServiceError,
  25. NoAudioUploadedServiceError,
  26. ProviderNotSupportSpeechToTextServiceError,
  27. UnsupportedAudioTypeServiceError,
  28. )
  29. class AudioApi(Resource):
  30. @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.FORM))
  31. def post(self, app_model: App, end_user: EndUser):
  32. app_model_config: AppModelConfig = app_model.app_model_config
  33. if not app_model_config.speech_to_text_dict['enabled']:
  34. raise AppUnavailableError()
  35. file = request.files['file']
  36. try:
  37. response = AudioService.transcript_asr(
  38. tenant_id=app_model.tenant_id,
  39. file=file,
  40. end_user=end_user
  41. )
  42. return response
  43. except services.errors.app_model_config.AppModelConfigBrokenError:
  44. logging.exception("App model config broken.")
  45. raise AppUnavailableError()
  46. except NoAudioUploadedServiceError:
  47. raise NoAudioUploadedError()
  48. except AudioTooLargeServiceError as e:
  49. raise AudioTooLargeError(str(e))
  50. except UnsupportedAudioTypeServiceError:
  51. raise UnsupportedAudioTypeError()
  52. except ProviderNotSupportSpeechToTextServiceError:
  53. raise ProviderNotSupportSpeechToTextError()
  54. except ProviderTokenNotInitError as ex:
  55. raise ProviderNotInitializeError(ex.description)
  56. except QuotaExceededError:
  57. raise ProviderQuotaExceededError()
  58. except ModelCurrentlyNotSupportError:
  59. raise ProviderModelCurrentlyNotSupportError()
  60. except InvokeError as e:
  61. raise CompletionRequestError(e.description)
  62. except ValueError as e:
  63. raise e
  64. except Exception as e:
  65. logging.exception("internal server error.")
  66. raise InternalServerError()
  67. class TextApi(Resource):
  68. @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.JSON, required=True))
  69. def post(self, app_model: App, end_user: EndUser):
  70. parser = reqparse.RequestParser()
  71. parser.add_argument('text', type=str, required=True, nullable=False, location='json')
  72. parser.add_argument('streaming', type=bool, required=False, nullable=False, location='json')
  73. args = parser.parse_args()
  74. try:
  75. response = AudioService.transcript_tts(
  76. tenant_id=app_model.tenant_id,
  77. text=args['text'],
  78. end_user=end_user,
  79. voice=args['voice'] if args['voice'] else app_model.app_model_config.text_to_speech_dict.get('voice'),
  80. streaming=args['streaming']
  81. )
  82. return response
  83. except services.errors.app_model_config.AppModelConfigBrokenError:
  84. logging.exception("App model config broken.")
  85. raise AppUnavailableError()
  86. except NoAudioUploadedServiceError:
  87. raise NoAudioUploadedError()
  88. except AudioTooLargeServiceError as e:
  89. raise AudioTooLargeError(str(e))
  90. except UnsupportedAudioTypeServiceError:
  91. raise UnsupportedAudioTypeError()
  92. except ProviderNotSupportSpeechToTextServiceError:
  93. raise ProviderNotSupportSpeechToTextError()
  94. except ProviderTokenNotInitError as ex:
  95. raise ProviderNotInitializeError(ex.description)
  96. except QuotaExceededError:
  97. raise ProviderQuotaExceededError()
  98. except ModelCurrentlyNotSupportError:
  99. raise ProviderModelCurrentlyNotSupportError()
  100. except InvokeError as e:
  101. raise CompletionRequestError(e.description)
  102. except ValueError as e:
  103. raise e
  104. except Exception as e:
  105. logging.exception("internal server error.")
  106. raise InternalServerError()
  107. api.add_resource(AudioApi, '/audio-to-text')
  108. api.add_resource(TextApi, '/text-to-audio')