Skip to content

Commit 003f3d1

Browse files
committed
feat: Support Azure embedding model
1 parent 88deeda commit 003f3d1

File tree

3 files changed

+103
-2
lines changed

3 files changed

+103
-2
lines changed

apps/setting/models_provider/impl/azure_model_provider/azure_model_provider.py

Lines changed: 23 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -11,18 +11,39 @@
1111
from common.util.file_util import get_file_content
1212
from setting.models_provider.base_model_provider import IModelProvider, ModelProvideInfo, ModelInfo, \
1313
ModelTypeConst, ModelInfoManage
14+
from setting.models_provider.impl.azure_model_provider.credential.embedding import AzureOpenAIEmbeddingCredential
1415
from setting.models_provider.impl.azure_model_provider.credential.llm import AzureLLMModelCredential
1516
from setting.models_provider.impl.azure_model_provider.model.azure_chat_model import AzureChatModel
17+
from setting.models_provider.impl.azure_model_provider.model.embedding import AzureOpenAIEmbeddingModel
1618
from smartdoc.conf import PROJECT_DIR
1719

1820
# One shared credential form instance per supported model type.
base_azure_llm_model_credential = AzureLLMModelCredential()
base_azure_embedding_model_credential = AzureOpenAIEmbeddingCredential()

# Default chat-model entry. The description string tells the user that the
# concrete base model is determined by the Azure deployment name.
default_model_info = ModelInfo(
    'Azure OpenAI',
    '具体的基础模型由部署名决定',
    ModelTypeConst.LLM,
    base_azure_llm_model_credential,
    AzureChatModel,
    api_version='2024-02-15-preview',
)
2326

24-
model_info_manage = ModelInfoManage.builder().append_default_model_info(default_model_info).append_model_info(
25-
default_model_info).build()
27+
# Embedding models registered for this provider. Every entry shares the same
# credential form, model class and API version; only the name and the
# description differ, so the list is generated from (name, description) pairs.
embedding_model_info = [
    ModelInfo(
        embedding_name,
        embedding_desc,
        ModelTypeConst.EMBEDDING,
        base_azure_embedding_model_credential,
        AzureOpenAIEmbeddingModel,
        api_version='2023-05-15',
    )
    for embedding_name, embedding_desc in (
        ('text-embedding-3-large', '具体的基础模型由部署名决定'),
        ('text-embedding-3-small', ''),
        ('text-embedding-ada-002', ''),
    )
]

# Registry of every model this provider offers. The chat model is registered
# both as a default and as a regular entry; the first embedding model is also
# registered as a default.
model_info_manage = (
    ModelInfoManage.builder()
    .append_default_model_info(default_model_info)
    .append_model_info(default_model_info)
    .append_model_info_list(embedding_model_info)
    .append_default_model_info(embedding_model_info[0])
    .build()
)
2647

2748

2849
class AzureModelProvider(IModelProvider):
Lines changed: 55 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,55 @@
1+
# coding=utf-8
2+
"""
3+
@project: MaxKB
4+
@Author:虎
5+
@file: embedding.py
6+
@date:2024/7/11 17:08
7+
@desc:
8+
"""
9+
from typing import Dict
10+
11+
from langchain_core.messages import HumanMessage
12+
13+
from common import forms
14+
from common.exception.app_exception import AppApiException
15+
from common.forms import BaseForm, TooltipLabel
16+
from setting.models_provider.base_model_provider import BaseModelCredential, ValidCode
17+
18+
19+
20+
class AzureOpenAIEmbeddingCredential(BaseForm, BaseModelCredential):
    """Credential form and validator for Azure OpenAI embedding models.

    Declares the three required form fields (API version, endpoint and API
    key) and validates a submitted credential by building the model through
    the provider and issuing one embedding request.
    """

    def is_valid(self, model_type: str, model_name, model_credential: Dict[str, object], provider,
                 raise_exception=False):
        """Check whether ``model_credential`` yields a working embedding model.

        :param model_type: model type value to look up in the provider's type list
        :param model_name: model name forwarded to ``provider.get_model``
        :param model_credential: mapping that must contain ``api_base``,
            ``api_key`` and ``api_version``
        :param provider: object exposing ``get_model_type_list()`` and ``get_model()``
        :param raise_exception: when true, report failures by raising
            ``AppApiException`` instead of returning ``False``
        :return: ``True`` when the test embedding call succeeds, ``False`` on
            failure when ``raise_exception`` is false
        :raises AppApiException: always for an unsupported ``model_type``; for
            missing fields or a failed test call only when ``raise_exception``
            is true; and whenever the provider/model itself raises one
        """
        model_type_list = provider.get_model_type_list()
        if not any(mt.get('value') == model_type for mt in model_type_list):
            # An unsupported model type is raised regardless of raise_exception.
            raise AppApiException(ValidCode.valid_error.value, f'{model_type} 模型类型不支持')

        for key in ['api_base', 'api_key', 'api_version']:
            if key not in model_credential:
                if raise_exception:
                    raise AppApiException(ValidCode.valid_error.value, f'{key} 字段为必填字段')
                return False

        try:
            model = provider.get_model(model_type, model_name, model_credential)
            # A single real embedding request proves endpoint, key and version work together.
            model.embed_query('你好')
        except AppApiException:
            # Application-level errors already carry a user-facing message; pass them through.
            raise
        except Exception as e:
            if raise_exception:
                # Keep the underlying error as __cause__ so it is visible in logs/tracebacks.
                raise AppApiException(ValidCode.valid_error.value, '校验失败,请检查参数是否正确') from e
            return False

        return True

    def encryption_dict(self, model: Dict[str, object]):
        """Return a copy of ``model`` with ``api_key`` passed through ``encryption``.

        A missing ``api_key`` is treated as an empty string before encryption.
        """
        return {**model, 'api_key': super().encryption(model.get('api_key', ''))}

    # Form fields; all three are required.
    api_version = forms.TextInputField("API 版本 (api_version)", required=True)

    api_base = forms.TextInputField('API 域名 (azure_endpoint)', required=True)

    api_key = forms.PasswordInputField("API Key (api_key)", required=True)
55+
Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
1+
# coding=utf-8
2+
"""
3+
@project: MaxKB
4+
@Author:虎
5+
@file: embedding.py
6+
@date:2024/7/12 17:44
7+
@desc:
8+
"""
9+
from typing import Dict
10+
11+
from langchain_openai import AzureOpenAIEmbeddings
12+
13+
from setting.models_provider.base_model_provider import MaxKBBaseModel
14+
15+
16+
class AzureOpenAIEmbeddingModel(MaxKBBaseModel, AzureOpenAIEmbeddings):
    """Azure OpenAI embedding model combined with the MaxKB base-model interface."""

    @staticmethod
    def new_instance(model_type, model_name, model_credential: Dict[str, object], **model_kwargs):
        """Build an embedding model from a stored credential.

        :param model_type: not used by this factory
        :param model_name: passed to the embeddings client as ``model``
        :param model_credential: mapping read for ``api_key``, ``api_base``
            and ``api_version``; a missing key is passed on as ``None``
        :param model_kwargs: accepted but not used by this factory
        :return: an ``AzureOpenAIEmbeddingModel`` instance
        """
        # Construct this subclass rather than the bare AzureOpenAIEmbeddings so the
        # returned object is also an instance of MaxKBBaseModel.
        return AzureOpenAIEmbeddingModel(
            model=model_name,
            openai_api_key=model_credential.get('api_key'),
            azure_endpoint=model_credential.get('api_base'),
            openai_api_version=model_credential.get('api_version'),
            openai_api_type="azure",
        )

0 commit comments

Comments
 (0)