123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183 |
- import logging
- from flask import request
- from flask_restful import Resource, reqparse # type: ignore
- from werkzeug.exceptions import InternalServerError
- import services
- from controllers.console import api
- from controllers.console.app.error import (
- AppUnavailableError,
- AudioTooLargeError,
- CompletionRequestError,
- NoAudioUploadedError,
- ProviderModelCurrentlyNotSupportError,
- ProviderNotInitializeError,
- ProviderNotSupportSpeechToTextError,
- ProviderQuotaExceededError,
- UnsupportedAudioTypeError,
- )
- from controllers.console.app.wraps import get_app_model
- from controllers.console.wraps import account_initialization_required, setup_required
- from core.errors.error import ModelCurrentlyNotSupportError, ProviderTokenNotInitError, QuotaExceededError
- from core.model_runtime.errors.invoke import InvokeError
- from libs.login import login_required
- from models import App, AppMode
- from services.audio_service import AudioService
- from services.errors.audio import (
- AudioTooLargeServiceError,
- NoAudioUploadedServiceError,
- ProviderNotSupportSpeechToTextServiceError,
- UnsupportedAudioTypeServiceError,
- )
- class ChatMessageAudioApi(Resource):
- @setup_required
- @login_required
- @account_initialization_required
- @get_app_model(mode=[AppMode.CHAT, AppMode.AGENT_CHAT, AppMode.ADVANCED_CHAT])
- def post(self, app_model):
- file = request.files["file"]
- try:
- response = AudioService.transcript_asr(
- app_model=app_model,
- file=file,
- end_user=None,
- )
- return response
- except services.errors.app_model_config.AppModelConfigBrokenError:
- logging.exception("App model config broken.")
- raise AppUnavailableError()
- except NoAudioUploadedServiceError:
- raise NoAudioUploadedError()
- except AudioTooLargeServiceError as e:
- raise AudioTooLargeError(str(e))
- except UnsupportedAudioTypeServiceError:
- raise UnsupportedAudioTypeError()
- except ProviderNotSupportSpeechToTextServiceError:
- raise ProviderNotSupportSpeechToTextError()
- except ProviderTokenNotInitError as ex:
- raise ProviderNotInitializeError(ex.description)
- except QuotaExceededError:
- raise ProviderQuotaExceededError()
- except ModelCurrentlyNotSupportError:
- raise ProviderModelCurrentlyNotSupportError()
- except InvokeError as e:
- raise CompletionRequestError(e.description)
- except ValueError as e:
- raise e
- except Exception as e:
- logging.exception("Failed to handle post request to ChatMessageAudioApi")
- raise InternalServerError()
- class ChatMessageTextApi(Resource):
- @setup_required
- @login_required
- @account_initialization_required
- @get_app_model
- def post(self, app_model: App):
- from werkzeug.exceptions import InternalServerError
- try:
- parser = reqparse.RequestParser()
- parser.add_argument("message_id", type=str, location="json")
- parser.add_argument("text", type=str, location="json")
- parser.add_argument("voice", type=str, location="json")
- parser.add_argument("streaming", type=bool, location="json")
- args = parser.parse_args()
- message_id = args.get("message_id", None)
- text = args.get("text", None)
- if (
- app_model.mode in {AppMode.ADVANCED_CHAT.value, AppMode.WORKFLOW.value}
- and app_model.workflow
- and app_model.workflow.features_dict
- ):
- text_to_speech = app_model.workflow.features_dict.get("text_to_speech")
- if text_to_speech is None:
- raise ValueError("TTS is not enabled")
- voice = args.get("voice") or text_to_speech.get("voice")
- else:
- try:
- if app_model.app_model_config is None:
- raise ValueError("AppModelConfig not found")
- voice = args.get("voice") or app_model.app_model_config.text_to_speech_dict.get("voice")
- except Exception:
- voice = None
- response = AudioService.transcript_tts(app_model=app_model, text=text, message_id=message_id, voice=voice)
- return response
- except services.errors.app_model_config.AppModelConfigBrokenError:
- logging.exception("App model config broken.")
- raise AppUnavailableError()
- except NoAudioUploadedServiceError:
- raise NoAudioUploadedError()
- except AudioTooLargeServiceError as e:
- raise AudioTooLargeError(str(e))
- except UnsupportedAudioTypeServiceError:
- raise UnsupportedAudioTypeError()
- except ProviderNotSupportSpeechToTextServiceError:
- raise ProviderNotSupportSpeechToTextError()
- except ProviderTokenNotInitError as ex:
- raise ProviderNotInitializeError(ex.description)
- except QuotaExceededError:
- raise ProviderQuotaExceededError()
- except ModelCurrentlyNotSupportError:
- raise ProviderModelCurrentlyNotSupportError()
- except InvokeError as e:
- raise CompletionRequestError(e.description)
- except ValueError as e:
- raise e
- except Exception as e:
- logging.exception("Failed to handle post request to ChatMessageTextApi")
- raise InternalServerError()
- class TextModesApi(Resource):
- @setup_required
- @login_required
- @account_initialization_required
- @get_app_model
- def get(self, app_model):
- try:
- parser = reqparse.RequestParser()
- parser.add_argument("language", type=str, required=True, location="args")
- args = parser.parse_args()
- response = AudioService.transcript_tts_voices(
- tenant_id=app_model.tenant_id,
- language=args["language"],
- )
- return response
- except services.errors.audio.ProviderNotSupportTextToSpeechLanageServiceError:
- raise AppUnavailableError("Text to audio voices language parameter loss.")
- except NoAudioUploadedServiceError:
- raise NoAudioUploadedError()
- except AudioTooLargeServiceError as e:
- raise AudioTooLargeError(str(e))
- except UnsupportedAudioTypeServiceError:
- raise UnsupportedAudioTypeError()
- except ProviderNotSupportSpeechToTextServiceError:
- raise ProviderNotSupportSpeechToTextError()
- except ProviderTokenNotInitError as ex:
- raise ProviderNotInitializeError(ex.description)
- except QuotaExceededError:
- raise ProviderQuotaExceededError()
- except ModelCurrentlyNotSupportError:
- raise ProviderModelCurrentlyNotSupportError()
- except InvokeError as e:
- raise CompletionRequestError(e.description)
- except ValueError as e:
- raise e
- except Exception as e:
- logging.exception("Failed to handle get request to TextModesApi")
- raise InternalServerError()
- api.add_resource(ChatMessageAudioApi, "/apps/<uuid:app_id>/audio-to-text")
- api.add_resource(ChatMessageTextApi, "/apps/<uuid:app_id>/text-to-audio")
- api.add_resource(TextModesApi, "/apps/<uuid:app_id>/text-to-audio/voices")
|