forked from langgenius/dify
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Feat/chat support voice input (langgenius#532)
- Loading branch information
Showing
22 changed files
with
501 additions
and
5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,69 @@ | ||
# -*- coding:utf-8 -*- | ||
import logging | ||
|
||
from flask import request | ||
from flask_login import login_required | ||
from werkzeug.exceptions import InternalServerError, NotFound | ||
|
||
import services | ||
from controllers.console import api | ||
from controllers.console.app import _get_app | ||
from controllers.console.app.error import AppUnavailableError, \ | ||
ProviderNotInitializeError, CompletionRequestError, ProviderQuotaExceededError, \ | ||
ProviderModelCurrentlyNotSupportError, NoAudioUploadedError, AudioTooLargeError, \ | ||
UnsupportedAudioTypeError, ProviderNotSupportSpeechToTextError | ||
from controllers.console.setup import setup_required | ||
from controllers.console.wraps import account_initialization_required | ||
from core.llm.error import LLMBadRequestError, LLMAPIUnavailableError, LLMAuthorizationError, LLMAPIConnectionError, \ | ||
LLMRateLimitError, ProviderTokenNotInitError, QuotaExceededError, ModelCurrentlyNotSupportError | ||
from flask_restful import Resource | ||
from services.audio_service import AudioService | ||
from services.errors.audio import NoAudioUploadedServiceError, AudioTooLargeServiceError, \ | ||
UnsupportedAudioTypeServiceError, ProviderNotSupportSpeechToTextServiceError | ||
|
||
|
||
class ChatMessageAudioApi(Resource):
    """Console resource that forwards an uploaded audio file to
    ``AudioService.transcript`` for a chat app."""

    @setup_required
    @login_required
    @account_initialization_required
    def post(self, app_id):
        """Transcribe the audio uploaded in the ``file`` multipart field.

        Args:
            app_id: Identifier of the app; coerced to ``str`` and resolved
                with ``_get_app(app_id, 'chat')``.

        Returns:
            Whatever ``AudioService.transcript`` returns, unchanged.

        Raises:
            NoAudioUploadedError: The request has no ``file`` field, or the
                service reported that no audio was uploaded.
            AppUnavailableError: The app model config is broken.
            AudioTooLargeError: The service rejected the file size.
            UnsupportedAudioTypeError: The service rejected the file type.
            ProviderNotSupportSpeechToTextError: The provider cannot
                transcribe audio.
            ProviderNotInitializeError: The provider token is not initialised.
            ProviderQuotaExceededError: The provider quota is exhausted.
            ProviderModelCurrentlyNotSupportError: The model is currently
                not supported.
            CompletionRequestError: The LLM backend reported a request,
                connection, availability, rate-limit or authorization error.
            ValueError: Propagated unchanged from the service.
            InternalServerError: Any other unexpected failure.
        """
        app_id = str(app_id)
        app_model = _get_app(app_id, 'chat')

        # Indexing ``request.files['file']`` raises werkzeug's generic
        # BadRequestKeyError when the field is absent; report the dedicated
        # error instead. This check must stay outside the ``try`` below,
        # whose catch-all would otherwise turn it into a 500.
        file = request.files.get('file')
        if file is None:
            raise NoAudioUploadedError()

        try:
            response = AudioService.transcript(
                tenant_id=app_model.tenant_id,
                file=file,
            )

            return response
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            raise AppUnavailableError()
        except NoAudioUploadedServiceError:
            raise NoAudioUploadedError()
        except AudioTooLargeServiceError as e:
            raise AudioTooLargeError(str(e))
        except UnsupportedAudioTypeServiceError:
            raise UnsupportedAudioTypeError()
        except ProviderNotSupportSpeechToTextServiceError:
            raise ProviderNotSupportSpeechToTextError()
        except ProviderTokenNotInitError:
            raise ProviderNotInitializeError()
        except QuotaExceededError:
            raise ProviderQuotaExceededError()
        except ModelCurrentlyNotSupportError:
            raise ProviderModelCurrentlyNotSupportError()
        except (LLMBadRequestError, LLMAPIConnectionError, LLMAPIUnavailableError,
                LLMRateLimitError, LLMAuthorizationError) as e:
            raise CompletionRequestError(str(e))
        except ValueError:
            # Let ValueError through untouched so the catch-all below does
            # not mask it as an internal server error.
            raise
        except Exception:
            logging.exception("internal server error.")
            raise InternalServerError()
|
||
|
||
# Route registration: POST audio for a console app identified by UUID.
api.add_resource(
    ChatMessageAudioApi,
    '/apps/<uuid:app_id>/audio-to-text',
)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,66 @@ | ||
# -*- coding:utf-8 -*- | ||
import logging | ||
|
||
from flask import request | ||
from werkzeug.exceptions import InternalServerError | ||
|
||
import services | ||
from controllers.console import api | ||
from controllers.console.app.error import AppUnavailableError, ProviderNotInitializeError, \ | ||
ProviderQuotaExceededError, ProviderModelCurrentlyNotSupportError, CompletionRequestError, \ | ||
NoAudioUploadedError, AudioTooLargeError, \ | ||
UnsupportedAudioTypeError, ProviderNotSupportSpeechToTextError | ||
from controllers.console.explore.wraps import InstalledAppResource | ||
from core.llm.error import LLMBadRequestError, LLMAPIUnavailableError, LLMAuthorizationError, LLMAPIConnectionError, \ | ||
LLMRateLimitError, ProviderTokenNotInitError, QuotaExceededError, ModelCurrentlyNotSupportError | ||
from services.audio_service import AudioService | ||
from services.errors.audio import NoAudioUploadedServiceError, AudioTooLargeServiceError, \ | ||
UnsupportedAudioTypeServiceError, ProviderNotSupportSpeechToTextServiceError | ||
from models.model import AppModelConfig | ||
|
||
|
||
class ChatAudioApi(InstalledAppResource):
    """Installed-app resource that forwards an uploaded audio file to
    ``AudioService.transcript``."""

    def post(self, installed_app):
        """Transcribe the audio uploaded in the ``file`` multipart field.

        Args:
            installed_app: Object whose ``app`` attribute is the app model
                (presumably injected by ``InstalledAppResource``; confirm
                against the wrapper).

        Returns:
            Whatever ``AudioService.transcript`` returns, unchanged.

        Raises:
            AppUnavailableError: The app has no model config, speech-to-text
                is not enabled in it, or the config is broken.
            NoAudioUploadedError: The request has no ``file`` field, or the
                service reported that no audio was uploaded.
            AudioTooLargeError: The service rejected the file size.
            UnsupportedAudioTypeError: The service rejected the file type.
            ProviderNotSupportSpeechToTextError: The provider cannot
                transcribe audio.
            ProviderNotInitializeError: The provider token is not initialised.
            ProviderQuotaExceededError: The provider quota is exhausted.
            ProviderModelCurrentlyNotSupportError: The model is currently
                not supported.
            CompletionRequestError: The LLM backend reported a request,
                connection, availability, rate-limit or authorization error.
            ValueError: Propagated unchanged from the service.
            InternalServerError: Any other unexpected failure.
        """
        app_model = installed_app.app
        app_model_config: AppModelConfig = app_model.app_model_config

        # Guard against a missing config so the request fails with the
        # documented "unavailable" error rather than an AttributeError.
        if app_model_config is None \
                or not app_model_config.speech_to_text_dict['enabled']:
            raise AppUnavailableError()

        # Indexing ``request.files['file']`` raises werkzeug's generic
        # BadRequestKeyError when the field is absent; report the dedicated
        # error instead. This check must stay outside the ``try`` below,
        # whose catch-all would otherwise turn it into a 500.
        file = request.files.get('file')
        if file is None:
            raise NoAudioUploadedError()

        try:
            response = AudioService.transcript(
                tenant_id=app_model.tenant_id,
                file=file,
            )

            return response
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            raise AppUnavailableError()
        except NoAudioUploadedServiceError:
            raise NoAudioUploadedError()
        except AudioTooLargeServiceError as e:
            raise AudioTooLargeError(str(e))
        except UnsupportedAudioTypeServiceError:
            raise UnsupportedAudioTypeError()
        except ProviderNotSupportSpeechToTextServiceError:
            raise ProviderNotSupportSpeechToTextError()
        except ProviderTokenNotInitError:
            raise ProviderNotInitializeError()
        except QuotaExceededError:
            raise ProviderQuotaExceededError()
        except ModelCurrentlyNotSupportError:
            raise ProviderModelCurrentlyNotSupportError()
        except (LLMBadRequestError, LLMAPIConnectionError, LLMAPIUnavailableError,
                LLMRateLimitError, LLMAuthorizationError) as e:
            raise CompletionRequestError(str(e))
        except ValueError:
            # Let ValueError through untouched so the catch-all below does
            # not mask it as an internal server error.
            raise
        except Exception:
            logging.exception("internal server error.")
            raise InternalServerError()
|
||
|
||
# Route registration: an explicit endpoint name is passed for this resource.
api.add_resource(
    ChatAudioApi,
    '/installed-apps/<uuid:installed_app_id>/audio-to-text',
    endpoint='installed_app_audio',
)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,61 @@ | ||
import logging | ||
|
||
from flask import request | ||
from werkzeug.exceptions import InternalServerError | ||
|
||
import services | ||
from controllers.service_api import api | ||
from controllers.service_api.app.error import AppUnavailableError, ProviderNotInitializeError, CompletionRequestError, ProviderQuotaExceededError, \ | ||
ProviderModelCurrentlyNotSupportError, NoAudioUploadedError, AudioTooLargeError, UnsupportedAudioTypeError, \ | ||
ProviderNotSupportSpeechToTextError | ||
from controllers.service_api.wraps import AppApiResource | ||
from core.llm.error import LLMBadRequestError, LLMAuthorizationError, LLMAPIUnavailableError, LLMAPIConnectionError, \ | ||
LLMRateLimitError, ProviderTokenNotInitError, QuotaExceededError, ModelCurrentlyNotSupportError | ||
from models.model import App, AppModelConfig | ||
from services.audio_service import AudioService | ||
from services.errors.audio import NoAudioUploadedServiceError, AudioTooLargeServiceError, \ | ||
UnsupportedAudioTypeServiceError, ProviderNotSupportSpeechToTextServiceError | ||
|
||
class AudioApi(AppApiResource):
    """Service-API resource that forwards an uploaded audio file to
    ``AudioService.transcript``."""

    def post(self, app_model: App, end_user):
        """Transcribe the audio uploaded in the ``file`` multipart field.

        Args:
            app_model: App whose tenant and model config are used.
            end_user: Not used by this handler (presumably supplied by
                ``AppApiResource``; confirm against the wrapper).

        Returns:
            Whatever ``AudioService.transcript`` returns, unchanged.

        Raises:
            AppUnavailableError: The app has no model config, speech-to-text
                is not enabled in it, or the config is broken.
            NoAudioUploadedError: The request has no ``file`` field, or the
                service reported that no audio was uploaded.
            AudioTooLargeError: The service rejected the file size.
            UnsupportedAudioTypeError: The service rejected the file type.
            ProviderNotSupportSpeechToTextError: The provider cannot
                transcribe audio.
            ProviderNotInitializeError: The provider token is not initialised.
            ProviderQuotaExceededError: The provider quota is exhausted.
            ProviderModelCurrentlyNotSupportError: The model is currently
                not supported.
            CompletionRequestError: The LLM backend reported a request,
                connection, availability, rate-limit or authorization error.
            ValueError: Propagated unchanged from the service.
            InternalServerError: Any other unexpected failure.
        """
        app_model_config: AppModelConfig = app_model.app_model_config

        # Guard against a missing config so the request fails with the
        # documented "unavailable" error rather than an AttributeError.
        if app_model_config is None \
                or not app_model_config.speech_to_text_dict['enabled']:
            raise AppUnavailableError()

        # Indexing ``request.files['file']`` raises werkzeug's generic
        # BadRequestKeyError when the field is absent; report the dedicated
        # error instead. This check must stay outside the ``try`` below,
        # whose catch-all would otherwise turn it into a 500.
        file = request.files.get('file')
        if file is None:
            raise NoAudioUploadedError()

        try:
            response = AudioService.transcript(
                tenant_id=app_model.tenant_id,
                file=file,
            )

            return response
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            raise AppUnavailableError()
        except NoAudioUploadedServiceError:
            raise NoAudioUploadedError()
        except AudioTooLargeServiceError as e:
            raise AudioTooLargeError(str(e))
        except UnsupportedAudioTypeServiceError:
            raise UnsupportedAudioTypeError()
        except ProviderNotSupportSpeechToTextServiceError:
            raise ProviderNotSupportSpeechToTextError()
        except ProviderTokenNotInitError:
            raise ProviderNotInitializeError()
        except QuotaExceededError:
            raise ProviderQuotaExceededError()
        except ModelCurrentlyNotSupportError:
            raise ProviderModelCurrentlyNotSupportError()
        except (LLMBadRequestError, LLMAPIConnectionError, LLMAPIUnavailableError,
                LLMRateLimitError, LLMAuthorizationError) as e:
            raise CompletionRequestError(str(e))
        except ValueError:
            # Let ValueError through untouched so the catch-all below does
            # not mask it as an internal server error.
            raise
        except Exception:
            logging.exception("internal server error.")
            raise InternalServerError()
|
||
# Route registration for the service-API audio transcription resource.
api.add_resource(
    AudioApi,
    '/audio-to-text',
)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.