优化 get_retrieve_info 方法：将 outputs 参数类型调整为 list[dict]，并新增 segmentid_to_title 字典，以提升内容标题获取逻辑的准确性。

This commit is contained in:
2025-07-02 13:34:06 +08:00
parent d811ae411f
commit d835439fea
+3 -2
View File
@@ -341,7 +341,7 @@ content: "{content}"
except Exception as e:
return -1
def get_retrieve_info(self, query: str, outputs: dict, reranker_sorce_info:list) -> tuple:
def get_retrieve_info(self, query: str, outputs: list[dict], reranker_sorce_info:list) -> tuple:
"""
获取检索信息并计算分数
@@ -357,6 +357,7 @@ content: "{content}"
total_score = 0
valid_scores = 0
retrieve_title = []
segmentid_to_title = { result["segment_id"]:result["title"].split("/")[-1] for result in outputs}
# 使用线程池并发计算分数
with ThreadPoolExecutor() as executor:
@@ -372,7 +373,7 @@ content: "{content}"
for future in as_completed(future_to_content):
content, segment_id = future_to_content[future]
score = future.result()
content_title = content.split("\n")[0]
content_title = segmentid_to_title[segment_id]
if score != -1:
max_score = max(max_score, score)