From adce2a38099ce6a5a51db976a5e0129fdc703211 Mon Sep 17 00:00:00 2001 From: paituo <330435863@qq.com> Date: Tue, 10 Sep 2024 08:42:12 +0800 Subject: [PATCH] =?UTF-8?q?=E6=9B=B4=E6=96=B0xinference=E6=94=AF=E6=8C=81?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- backend/app/settings.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/backend/app/settings.py b/backend/app/settings.py index 761a8c1..8486e05 100644 --- a/backend/app/settings.py +++ b/backend/app/settings.py @@ -3,15 +3,18 @@ from typing import Dict from abc import abstractmethod from llama_index.core.constants import DEFAULT_TEMPERATURE from llama_index.core.settings import Settings +from llama_index.embeddings.xinference import XinferenceEmbedding from llama_index.llms.xinference import Xinference +#from llama_index.embeddings.xinference import XinferenceEmbedding from llama_index.llms.xinference.base import DEFAULT_XINFERENCE_TEMP +from llama_index.postprocessor.xinference_rerank import XinferenceRerank -from app.xinference.base import XinferenceEmbedding, XinferenceRerank from app.engine.loaders import getProjectInfos from app.api.routers.request.base import ProjectInfo +from modelProvide.customDashScope import CustomDashScope from util.register import * from llama_index.core.callbacks import CallbackManager -from modelProvide.customDashScope import CustomDashScope + ModelPlateCategory = '模型平台' @@ -107,7 +110,7 @@ class XinferencePlatform(ModelPlatform): embed_model_name = os.getenv("EMBEDDING_MODEL") dimensions = os.getenv("EMBEDDING_DIM") dimensions = int(dimensions) if dimensions is not None else None - return XinferenceEmbedding(embed_model_name, embedding_base_url, dimensions=dimensions) + return XinferenceEmbedding(embed_model_name, embedding_base_url) def rerank(self): rerank_model = os.getenv("RERANK_MODEL")