mirror of
				https://github.com/langgenius/dify.git
				synced 2025-10-31 10:53:02 +00:00 
			
		
		
		
	 06fcc0c650
			
		
	
	
		06fcc0c650
		
			
		
	
	
	
	
		
			
			Co-authored-by: luowei <glpat-EjySCyNjWiLqAED-YmwM> Co-authored-by: crazywoola <427733928@qq.com> Co-authored-by: crazywoola <100913391+crazywoola@users.noreply.github.com>
		
			
				
	
	
		
			132 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			132 lines
		
	
	
		
			5.2 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| import logging
 | |
| 
 | |
| from flask import request
 | |
| from flask_restful import Resource, reqparse
 | |
| from werkzeug.exceptions import InternalServerError
 | |
| 
 | |
| import services
 | |
| from controllers.service_api import api
 | |
| from controllers.service_api.app.error import (
 | |
|     AppUnavailableError,
 | |
|     AudioTooLargeError,
 | |
|     CompletionRequestError,
 | |
|     NoAudioUploadedError,
 | |
|     ProviderModelCurrentlyNotSupportError,
 | |
|     ProviderNotInitializeError,
 | |
|     ProviderNotSupportSpeechToTextError,
 | |
|     ProviderQuotaExceededError,
 | |
|     UnsupportedAudioTypeError,
 | |
| )
 | |
| from controllers.service_api.wraps import FetchUserArg, WhereisUserArg, validate_app_token
 | |
| from core.errors.error import ModelCurrentlyNotSupportError, ProviderTokenNotInitError, QuotaExceededError
 | |
| from core.model_runtime.errors.invoke import InvokeError
 | |
| from models.model import App, AppMode, EndUser
 | |
| from services.audio_service import AudioService
 | |
| from services.errors.audio import (
 | |
|     AudioTooLargeServiceError,
 | |
|     NoAudioUploadedServiceError,
 | |
|     ProviderNotSupportSpeechToTextServiceError,
 | |
|     UnsupportedAudioTypeServiceError,
 | |
| )
 | |
| 
 | |
| 
 | |
class AudioApi(Resource):
    """Service-API resource that transcribes an uploaded audio file to text."""

    @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.FORM))
    def post(self, app_model: App, end_user: EndUser):
        """Run speech-to-text on the file uploaded under the ``file`` form field.

        Args:
            app_model: Application passed in alongside the validated app token.
            end_user: End user passed in by ``validate_app_token`` (configured
                here to read the user from the form data).

        Returns:
            Whatever ``AudioService.transcript_asr`` returns, unchanged.

        Raises:
            AppUnavailableError: The app model config is broken.
            NoAudioUploadedError, AudioTooLargeError, UnsupportedAudioTypeError,
            ProviderNotSupportSpeechToTextError: Translated from the matching
                audio service errors.
            ProviderNotInitializeError, ProviderQuotaExceededError,
            ProviderModelCurrentlyNotSupportError: Translated from the matching
                core provider errors.
            CompletionRequestError: The model invocation failed.
            ValueError: Propagated unchanged.
            InternalServerError: Any other unexpected failure (logged first).
        """
        # Looked up outside the ``try`` on purpose: a failure here must not be
        # routed through the service-error translation below.
        uploaded_audio = request.files['file']

        try:
            return AudioService.transcript_asr(
                app_model=app_model,
                file=uploaded_audio,
                end_user=end_user,
            )
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            raise AppUnavailableError()
        except NoAudioUploadedServiceError:
            raise NoAudioUploadedError()
        except AudioTooLargeServiceError as too_large:
            raise AudioTooLargeError(str(too_large))
        except UnsupportedAudioTypeServiceError:
            raise UnsupportedAudioTypeError()
        except ProviderNotSupportSpeechToTextServiceError:
            raise ProviderNotSupportSpeechToTextError()
        except ProviderTokenNotInitError as not_initialized:
            raise ProviderNotInitializeError(not_initialized.description)
        except QuotaExceededError:
            raise ProviderQuotaExceededError()
        except ModelCurrentlyNotSupportError:
            raise ProviderModelCurrentlyNotSupportError()
        except InvokeError as invoke_failure:
            raise CompletionRequestError(invoke_failure.description)
        except ValueError:
            # Let ValueError through untouched instead of masking it as a 500.
            raise
        except Exception:
            logging.exception("internal server error.")
            raise InternalServerError()
 | |
| 
 | |
| 
 | |
class TextApi(Resource):
    """Service-API resource that converts text (or a stored message) to audio."""

    @validate_app_token(fetch_user_arg=FetchUserArg(fetch_from=WhereisUserArg.JSON))
    def post(self, app_model: App, end_user: EndUser):
        """Run text-to-speech for the JSON request body.

        JSON fields read: ``message_id``, ``voice``, ``text`` and ``streaming``
        (``streaming`` is parsed but not forwarded to the service).

        The voice is taken from the request when given. Otherwise it falls back
        to the app's configured text-to-speech voice: the workflow features for
        advanced-chat/workflow apps that have them, the app model config for
        everything else. If no voice is configured, ``None`` is passed on.

        Args:
            app_model: Application passed in alongside the validated app token.
            end_user: End user passed in by ``validate_app_token`` (configured
                here to read the user from the JSON body).

        Returns:
            Whatever ``AudioService.transcript_tts`` returns, unchanged.

        Raises:
            AppUnavailableError: The app model config is broken.
            NoAudioUploadedError, AudioTooLargeError, UnsupportedAudioTypeError,
            ProviderNotSupportSpeechToTextError: Translated from the matching
                audio service errors.
            ProviderNotInitializeError, ProviderQuotaExceededError,
            ProviderModelCurrentlyNotSupportError: Translated from the matching
                core provider errors.
            CompletionRequestError: The model invocation failed.
            ValueError: Propagated unchanged.
            InternalServerError: Any other unexpected failure (logged first).
        """
        try:
            parser = reqparse.RequestParser()
            parser.add_argument('message_id', type=str, required=False, location='json')
            parser.add_argument('voice', type=str, location='json')
            parser.add_argument('text', type=str, location='json')
            parser.add_argument('streaming', type=bool, location='json')
            args = parser.parse_args()

            message_id = args.get('message_id', None)
            text = args.get('text', None)

            # An explicit voice in the request always wins; only consult the
            # app configuration when the caller did not provide one.
            voice = args.get('voice')
            if not voice:
                if (app_model.mode in [AppMode.ADVANCED_CHAT.value, AppMode.WORKFLOW.value]
                        and app_model.workflow
                        and app_model.workflow.features_dict):
                    # The features dict may lack a 'text_to_speech' section (or
                    # hold None for it); treat that as "no configured voice"
                    # rather than failing with AttributeError -> HTTP 500.
                    text_to_speech = app_model.workflow.features_dict.get('text_to_speech') or {}
                    voice = text_to_speech.get('voice')
                else:
                    try:
                        voice = app_model.app_model_config.text_to_speech_dict.get('voice')
                    except Exception:
                        # Best effort: a missing or unreadable app model config
                        # simply means there is no default voice.
                        voice = None

            response = AudioService.transcript_tts(
                app_model=app_model,
                message_id=message_id,
                end_user=end_user.external_user_id,
                voice=voice,
                text=text
            )

            return response
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            raise AppUnavailableError()
        except NoAudioUploadedServiceError:
            raise NoAudioUploadedError()
        except AudioTooLargeServiceError as e:
            raise AudioTooLargeError(str(e))
        except UnsupportedAudioTypeServiceError:
            raise UnsupportedAudioTypeError()
        except ProviderNotSupportSpeechToTextServiceError:
            raise ProviderNotSupportSpeechToTextError()
        except ProviderTokenNotInitError as ex:
            raise ProviderNotInitializeError(ex.description)
        except QuotaExceededError:
            raise ProviderQuotaExceededError()
        except ModelCurrentlyNotSupportError:
            raise ProviderModelCurrentlyNotSupportError()
        except InvokeError as e:
            raise CompletionRequestError(e.description)
        except ValueError:
            # Let ValueError through untouched instead of masking it as a 500.
            raise
        except Exception:
            logging.exception("internal server error.")
            raise InternalServerError()
 | |
| 
 | |
| 
 | |
# Register the audio endpoints on the service API.
api.add_resource(AudioApi, '/audio-to-text')
api.add_resource(TextApi, '/text-to-audio')
 |