Du kannst nicht mehr als 25 Themen auswählen. Themen müssen mit entweder einem Buchstaben oder einer Ziffer beginnen. Sie können Bindestriche („-“) enthalten und bis zu 35 Zeichen lang sein.

audio.py 5.9KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146
  1. import logging
  2. from flask import request
  3. from flask_restx import Resource, reqparse
  4. from werkzeug.exceptions import InternalServerError
  5. import services
  6. from controllers.service_api import service_api_ns
  7. from controllers.service_api.app.error import (
  8. AppUnavailableError,
  9. AudioTooLargeError,
  10. CompletionRequestError,
  11. NoAudioUploadedError,
  12. ProviderModelCurrentlyNotSupportError,
  13. ProviderNotInitializeError,
  14. ProviderNotSupportSpeechToTextError,
  15. ProviderQuotaExceededError,
  16. UnsupportedAudioTypeError,
  17. )
  18. from controllers.service_api.wraps import FetchUserArg, WhereisUserArg, validate_app_token
  19. from core.errors.error import ModelCurrentlyNotSupportError, ProviderTokenNotInitError, QuotaExceededError
  20. from core.model_runtime.errors.invoke import InvokeError
  21. from models.model import App, EndUser
  22. from services.audio_service import AudioService
  23. from services.errors.audio import (
  24. AudioTooLargeServiceError,
  25. NoAudioUploadedServiceError,
  26. ProviderNotSupportSpeechToTextServiceError,
  27. UnsupportedAudioTypeServiceError,
  28. )
  @service_api_ns.route("/audio-to-text")
  class AudioApi(Resource):
      """Service API resource exposing speech-to-text at ``/audio-to-text``."""

      @service_api_ns.doc("audio_to_text")
      @service_api_ns.doc(description="Convert audio to text using speech-to-text")
      @service_api_ns.doc(
          responses={
              200: "Audio successfully transcribed",
              400: "Bad request - no audio or invalid audio",
              401: "Unauthorized - invalid API token",
              413: "Audio file too large",
              415: "Unsupported audio type",
              500: "Internal server error",
          }
      )
      @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.FORM))
      def post(self, app_model: App, end_user: EndUser):
          """Convert audio to text using speech-to-text.

          Accepts an audio file upload (multipart form field ``file``) and
          returns whatever ``AudioService.transcript_asr`` produces for it.

          Args:
              app_model: Application supplied by ``validate_app_token``.
              end_user: End user supplied by ``validate_app_token``.

          Raises:
              NoAudioUploadedError: The request carries no ``file`` part, or the
                  service reports that no audio was uploaded.
              AppUnavailableError: The app model configuration is broken.
              AudioTooLargeError: The service rejected the file as too large.
              UnsupportedAudioTypeError: The service rejected the audio type.
              ProviderNotSupportSpeechToTextError: The provider has no
                  speech-to-text support.
              ProviderNotInitializeError: The provider token is not initialised.
              ProviderQuotaExceededError: The provider quota is exhausted.
              ProviderModelCurrentlyNotSupportError: The model is currently not
                  supported.
              CompletionRequestError: The model invocation failed.
              ValueError: Re-raised unchanged from the service.
              InternalServerError: Any other unexpected failure.
          """
          # A missing upload is reported with the API's dedicated error instead
          # of the generic key-lookup failure that request.files["file"] yields.
          file = request.files.get("file")
          if file is None:
              raise NoAudioUploadedError()

          try:
              return AudioService.transcript_asr(app_model=app_model, file=file, end_user=end_user)
          except services.errors.app_model_config.AppModelConfigBrokenError:
              logging.exception("App model config broken.")
              raise AppUnavailableError()
          except NoAudioUploadedServiceError:
              raise NoAudioUploadedError()
          except AudioTooLargeServiceError as e:
              raise AudioTooLargeError(str(e))
          except UnsupportedAudioTypeServiceError:
              raise UnsupportedAudioTypeError()
          except ProviderNotSupportSpeechToTextServiceError:
              raise ProviderNotSupportSpeechToTextError()
          except ProviderTokenNotInitError as ex:
              raise ProviderNotInitializeError(ex.description)
          except QuotaExceededError:
              raise ProviderQuotaExceededError()
          except ModelCurrentlyNotSupportError:
              raise ProviderModelCurrentlyNotSupportError()
          except InvokeError as e:
              raise CompletionRequestError(e.description)
          except ValueError:
              # Let ValueError through untouched; bare raise keeps the traceback.
              raise
          except Exception:
              # Last-resort boundary: log the details, expose only a generic 500.
              logging.exception("internal server error.")
              raise InternalServerError()
  def _build_text_to_audio_parser():
      """Create the request parser used by the text-to-audio API.

      Every argument is read from the JSON request body. Arguments are
      registered in the order listed in ``field_specs``.
      """
      parser = reqparse.RequestParser()
      field_specs = (
          ("message_id", {"type": str, "required": False, "help": "Message ID"}),
          ("voice", {"type": str, "help": "Voice to use for TTS"}),
          ("text", {"type": str, "help": "Text to convert to audio"}),
          ("streaming", {"type": bool, "help": "Enable streaming response"}),
      )
      for field_name, options in field_specs:
          parser.add_argument(field_name, location="json", **options)
      return parser


  # Parser instance shared by the text-to-audio endpoint and its API docs.
  text_to_audio_parser = _build_text_to_audio_parser()
  @service_api_ns.route("/text-to-audio")
  class TextApi(Resource):
      """Service API resource exposing text-to-speech at ``/text-to-audio``."""

      @service_api_ns.expect(text_to_audio_parser)
      @service_api_ns.doc("text_to_audio")
      @service_api_ns.doc(description="Convert text to audio using text-to-speech")
      @service_api_ns.doc(
          responses={
              200: "Text successfully converted to audio",
              400: "Bad request - invalid parameters",
              401: "Unauthorized - invalid API token",
              500: "Internal server error",
          }
      )
      @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.JSON))
      def post(self, app_model: App, end_user: EndUser):
          """Convert text to audio using text-to-speech.

          Reads ``message_id``, ``text`` and ``voice`` from the JSON body and
          returns whatever ``AudioService.transcript_tts`` produces. The
          ``streaming`` argument is declared on the parser but is not read or
          forwarded by this handler.

          Args:
              app_model: Application supplied by ``validate_app_token``.
              end_user: End user supplied by ``validate_app_token``; only its
                  ``external_user_id`` is passed on to the service.

          Raises:
              AppUnavailableError: The app model configuration is broken.
              NoAudioUploadedError: The service reports no audio was uploaded.
              AudioTooLargeError: The service rejected the audio as too large.
              UnsupportedAudioTypeError: The service rejected the audio type.
              ProviderNotSupportSpeechToTextError: The provider has no
                  speech-to-text support.
              ProviderNotInitializeError: The provider token is not initialised.
              ProviderQuotaExceededError: The provider quota is exhausted.
              ProviderModelCurrentlyNotSupportError: The model is currently not
                  supported.
              CompletionRequestError: The model invocation failed.
              ValueError: Re-raised unchanged from the service.
              InternalServerError: Any other unexpected failure in the service
                  call.
          """
          # Parse before the try block: an HTTP error raised while parsing the
          # request must keep its own status rather than being caught by the
          # catch-all handler below and turned into a 500.
          args = text_to_audio_parser.parse_args()
          message_id = args.get("message_id")
          text = args.get("text")
          voice = args.get("voice")

          try:
              return AudioService.transcript_tts(
                  app_model=app_model,
                  text=text,
                  voice=voice,
                  end_user=end_user.external_user_id,
                  message_id=message_id,
              )
          except services.errors.app_model_config.AppModelConfigBrokenError:
              logging.exception("App model config broken.")
              raise AppUnavailableError()
          except NoAudioUploadedServiceError:
              raise NoAudioUploadedError()
          except AudioTooLargeServiceError as e:
              raise AudioTooLargeError(str(e))
          except UnsupportedAudioTypeServiceError:
              raise UnsupportedAudioTypeError()
          except ProviderNotSupportSpeechToTextServiceError:
              raise ProviderNotSupportSpeechToTextError()
          except ProviderTokenNotInitError as ex:
              raise ProviderNotInitializeError(ex.description)
          except QuotaExceededError:
              raise ProviderQuotaExceededError()
          except ModelCurrentlyNotSupportError:
              raise ProviderModelCurrentlyNotSupportError()
          except InvokeError as e:
              raise CompletionRequestError(e.description)
          except ValueError:
              # Let ValueError through untouched; bare raise keeps the traceback.
              raise
          except Exception:
              # Last-resort boundary: log the details, expose only a generic 500.
              logging.exception("internal server error.")
              raise InternalServerError()