更新LlamaIndex版本库

This commit is contained in:
wanyaokun
2024-09-10 14:07:52 +08:00
parent 6f5548ee61
commit a165d55822
4 changed files with 80 additions and 7 deletions
+2 -2
View File
@@ -52,8 +52,8 @@ def get_chat_engine(filters=None, params:dict=None):
description=tree_summary_query_engine_tool_messages)
tools.append(query_engine_tool)
tools.append(query_engine_tool_1)
tools.append(summary_query_tool)
#tools.append(query_engine_tool_1)
#tools.append(summary_query_tool)
# Add additional tools
tools += ToolFactory.from_env()
+72
View File
@@ -0,0 +1,72 @@
from llama_index.llms.xinference import Xinference
from typing import Any, Callable, Dict, Optional, Sequence, Tuple
from llama_index.core.llms.callbacks import (
llm_chat_callback,
llm_completion_callback,
)
from llama_index.core.base.llms.types import (
ChatMessage,
ChatResponse,
ChatResponseGen,
CompletionResponse,
CompletionResponseGen,
LLMMetadata,
MessageRole,
)
from llama_index.llms.xinference.utils import (
xinference_message_to_history,
xinference_modelname_to_contextsize,
)
class XinfengModel(Xinference):
    """Xinference LLM that sends the conversation as a ``messages`` list.

    Both ``chat`` and ``stream_chat`` are overridden to call
    ``self._generator.chat(messages=..., generate_config=...)`` with the
    instance's ``temperature`` and ``max_tokens``.
    """

    @llm_chat_callback()
    def chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse:
        """Run a blocking chat completion and return the assistant reply.

        Args:
            messages: Conversation so far, oldest first.
            **kwargs: Accepted for interface compatibility; not forwarded
                to the generator.

        Returns:
            A ``ChatResponse`` holding the assistant message; ``delta`` is
            ``None`` because nothing is streamed.

        Raises:
            AssertionError: If ``self._generator`` is ``None``.
        """
        assert self._generator is not None
        # Convert to plain dicts exactly as stream_chat does, so both entry
        # points hand the generator the same payload shape.
        # NOTE(review): presumably the generator needs JSON-serializable
        # messages; raw ChatMessage objects are not -- confirm against the
        # installed xinference client.
        payload = [message.dict() for message in messages]
        completion = self._generator.chat(
            messages=payload,
            generate_config={
                "stream": False,
                "temperature": self.temperature,
                "max_tokens": self.max_tokens,
            },
        )
        response_text = completion["choices"][0]["message"]["content"]
        return ChatResponse(
            message=ChatMessage(
                role=MessageRole.ASSISTANT,
                content=response_text,
            ),
            delta=None,
        )

    @llm_chat_callback()
    def stream_chat(
        self, messages: Sequence[ChatMessage], **kwargs: Any
    ) -> ChatResponseGen:
        """Run a streaming chat completion.

        The request is issued immediately; the returned generator only
        consumes the resulting chunk iterator.

        Args:
            messages: Conversation so far, oldest first.
            **kwargs: Accepted for interface compatibility; not forwarded
                to the generator.

        Returns:
            A generator yielding one ``ChatResponse`` per received chunk.
            Each response carries the text accumulated so far in
            ``message.content`` and the newest fragment in ``delta``.

        Raises:
            AssertionError: If ``self._generator`` is ``None``.
        """
        payload = [message.dict() for message in messages]
        assert self._generator is not None
        response_iter = self._generator.chat(
            messages=payload,
            generate_config={
                "stream": True,
                "temperature": self.temperature,
                "max_tokens": self.max_tokens,
            },
        )

        def gen() -> ChatResponseGen:
            text = ""
            for chunk in response_iter:
                # A chunk's delta may lack "content" or carry an explicit
                # None; treat both as an empty fragment so the string
                # concatenation below cannot raise TypeError.
                delta = chunk["choices"][0]["delta"].get("content") or ""
                text += delta
                yield ChatResponse(
                    message=ChatMessage(
                        role=MessageRole.ASSISTANT,
                        content=text,
                    ),
                    delta=delta,
                )

        return gen()
@@ -5,7 +5,7 @@ from llama_index.core.callbacks.base import CallbackManager
from llama_index.core.indices.prompt_helper import PromptHelper
from llama_index.core.prompts import BasePromptTemplate
from llama_index.core.service_context import ServiceContext
from llama_index.core.service_context_elements.llm_predictor import LLMPredictorType
from llama_index.core.llms import LLM
from llama_index.core.types import BaseModel,RESPONSE_TEXT_TYPE
from llama_index.core.async_utils import run_async_tasks
from llama_index.core.utils import get_tokenizer
@@ -14,7 +14,7 @@ from llama_index.core.prompts.prompt_utils import get_empty_prompt_txt
class CustomTreeResponse(TreeSummarize):
def __init__(
self,
llm: Optional[LLMPredictorType] = None,
llm: Optional[LLM] = None,
callback_manager: Optional[CallbackManager] = None,
prompt_helper: Optional[PromptHelper] = None,
summary_template: Optional[BasePromptTemplate] = None,