-
Notifications
You must be signed in to change notification settings - Fork 1.5k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
1 parent
01e775d
commit 0402918
Showing
3 changed files
with
96 additions
and
0 deletions.
There are no files selected for viewing
43 changes: 43 additions & 0 deletions
43
apps/setting/models_provider/impl/xf_model_provider/credential/embedding.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,43 @@ | ||
# coding=utf-8 | ||
""" | ||
@project: MaxKB | ||
@Author:虎 | ||
@file: embedding.py | ||
@date:2024/10/17 15:40 | ||
@desc: | ||
""" | ||
from typing import Dict | ||
|
||
from common import forms | ||
from common.exception.app_exception import AppApiException | ||
from common.forms import BaseForm | ||
from setting.models_provider.base_model_provider import BaseModelCredential, ValidCode | ||
|
||
|
||
class XFEmbeddingCredential(BaseForm, BaseModelCredential): | ||
|
||
def is_valid(self, model_type: str, model_name, model_credential: Dict[str, object], provider, | ||
raise_exception=False): | ||
model_type_list = provider.get_model_type_list() | ||
if not any(list(filter(lambda mt: mt.get('value') == model_type, model_type_list))): | ||
raise AppApiException(ValidCode.valid_error.value, f'{model_type} 模型类型不支持') | ||
self.valid_form(model_credential) | ||
try: | ||
model = provider.get_model(model_type, model_name, model_credential) | ||
model.embed_query('你好') | ||
except Exception as e: | ||
if isinstance(e, AppApiException): | ||
raise e | ||
if raise_exception: | ||
raise AppApiException(ValidCode.valid_error.value, f'校验失败,请检查参数是否正确: {str(e)}') | ||
else: | ||
return False | ||
return True | ||
|
||
def encryption_dict(self, model: Dict[str, object]): | ||
return model | ||
|
||
base_url = forms.TextInputField('API 域名', required=True, default_value="https://emb-cn-huabei-1.xf-yun.com/") | ||
spark_app_id = forms.TextInputField('APP ID', required=True) | ||
spark_api_key = forms.PasswordInputField("API Key", required=True) | ||
spark_api_secret = forms.PasswordInputField('API Secret', required=True) |
49 changes: 49 additions & 0 deletions
49
apps/setting/models_provider/impl/xf_model_provider/model/embedding.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,49 @@ | ||
# coding=utf-8 | ||
""" | ||
@project: MaxKB | ||
@Author:虎 | ||
@file: embedding.py | ||
@date:2024/10/17 15:29 | ||
@desc: | ||
""" | ||
|
||
import base64 | ||
import json | ||
from typing import Dict, Optional | ||
|
||
import numpy as np | ||
from langchain_community.embeddings import SparkLLMTextEmbeddings | ||
from numpy import ndarray | ||
|
||
from setting.models_provider.base_model_provider import MaxKBBaseModel | ||
|
||
|
||
class XFEmbedding(MaxKBBaseModel, SparkLLMTextEmbeddings): | ||
@staticmethod | ||
def new_instance(model_type, model_name, model_credential: Dict[str, object], **model_kwargs): | ||
return XFEmbedding( | ||
spark_app_id=model_credential.get('spark_app_id'), | ||
spark_api_key=model_credential.get('spark_api_key'), | ||
spark_api_secret=model_credential.get('spark_api_secret') | ||
) | ||
|
||
@staticmethod | ||
def _parser_message( | ||
message: str, | ||
) -> Optional[ndarray]: | ||
data = json.loads(message) | ||
code = data["header"]["code"] | ||
if code != 0: | ||
# 这里是讯飞的QPS限制会报错,所以不建议用讯飞的向量模型 | ||
raise Exception(f"Request error: {code}, {data}") | ||
else: | ||
text_base = data["payload"]["feature"]["text"] | ||
text_data = base64.b64decode(text_base) | ||
dt = np.dtype(np.float32) | ||
dt = dt.newbyteorder("<") | ||
text = np.frombuffer(text_data, dtype=dt) | ||
if len(text) > 2560: | ||
array = text[:2560] | ||
else: | ||
array = text | ||
return array |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters