优化 get_retrieve_info 方法:调整 outputs 参数类型为 list[dict],并增加 segmentid_to_title 字典,以提升内容标题获取逻辑的准确性。
This commit is contained in:
@@ -341,7 +341,7 @@ content: "{content}"
|
|||||||
except Exception as e:
|
except Exception as e:
|
||||||
return -1
|
return -1
|
||||||
|
|
||||||
def get_retrieve_info(self, query: str, outputs: dict, reranker_sorce_info:list) -> tuple:
|
def get_retrieve_info(self, query: str, outputs: list[dict], reranker_sorce_info:list) -> tuple:
|
||||||
"""
|
"""
|
||||||
获取检索信息并计算分数
|
获取检索信息并计算分数
|
||||||
|
|
||||||
@@ -357,6 +357,7 @@ content: "{content}"
|
|||||||
total_score = 0
|
total_score = 0
|
||||||
valid_scores = 0
|
valid_scores = 0
|
||||||
retrieve_title = []
|
retrieve_title = []
|
||||||
|
segmentid_to_title = { result["segment_id"]:result["title"].split("/")[-1] for result in outputs}
|
||||||
|
|
||||||
# 使用线程池并发计算分数
|
# 使用线程池并发计算分数
|
||||||
with ThreadPoolExecutor() as executor:
|
with ThreadPoolExecutor() as executor:
|
||||||
@@ -372,7 +373,7 @@ content: "{content}"
|
|||||||
for future in as_completed(future_to_content):
|
for future in as_completed(future_to_content):
|
||||||
content, segment_id = future_to_content[future]
|
content, segment_id = future_to_content[future]
|
||||||
score = future.result()
|
score = future.result()
|
||||||
content_title = content.split("\n")[0]
|
content_title = segmentid_to_title[segment_id]
|
||||||
|
|
||||||
if score != -1:
|
if score != -1:
|
||||||
max_score = max(max_score, score)
|
max_score = max(max_score, score)
|
||||||
|
|||||||
Reference in New Issue
Block a user