From b519f9208754b85848c5ff6188d951f8e813501e Mon Sep 17 00:00:00 2001 From: ouyangyouzhang Date: Tue, 3 Jun 2025 17:45:32 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E5=A4=8D=E6=84=8F=E5=9B=BE=E8=AF=86?= =?UTF-8?q?=E5=88=AB=E4=B8=AD=E7=9A=84=E5=90=8C=E4=B9=89=E8=AF=8D=E5=A4=84?= =?UTF-8?q?=E7=90=86=E9=80=BB=E8=BE=91=EF=BC=8C=E7=A1=AE=E4=BF=9D=E5=90=8C?= =?UTF-8?q?=E4=B9=89=E8=AF=8D=E5=AD=97=E7=AC=A6=E4=B8=B2=E6=AD=A3=E7=A1=AE?= =?UTF-8?q?=E5=88=86=E5=89=B2=E4=B8=BA=E5=88=97=E8=A1=A8=EF=BC=9B=E6=9B=B4?= =?UTF-8?q?=E6=96=B0=E6=8F=90=E7=A4=BA=E6=A8=A1=E6=9D=BF=EF=BC=8C=E6=98=8E?= =?UTF-8?q?=E7=A1=AE=E8=BE=93=E5=87=BA=E8=A6=81=E6=B1=82=EF=BC=8C=E9=81=BF?= =?UTF-8?q?=E5=85=8D=E5=AF=B9=E5=85=B3=E9=94=AE=E8=AF=8D=E7=9A=84=E8=AF=AF?= =?UTF-8?q?=E8=A7=A3=E5=92=8C=E4=BF=AE=E6=94=B9=E3=80=82?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- rag2_0/intent_recognition/IntentRecognition.py | 2 ++ rag2_0/intent_recognition/PromptTemplates.py | 3 ++- 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/rag2_0/intent_recognition/IntentRecognition.py b/rag2_0/intent_recognition/IntentRecognition.py index 3a77e3a..f07d86c 100644 --- a/rag2_0/intent_recognition/IntentRecognition.py +++ b/rag2_0/intent_recognition/IntentRecognition.py @@ -210,6 +210,8 @@ class IntentRecognizer: current_key_terms = set() # 添加向量检索结果 for result in vector_results: + if isinstance(result.get('synonymous', []), str): + result['synonymous'] = result['synonymous'].split(';') term = Term( name=result.get('name'), synonymous=result.get('synonymous', []), diff --git a/rag2_0/intent_recognition/PromptTemplates.py b/rag2_0/intent_recognition/PromptTemplates.py index e24156b..5abe18f 100644 --- a/rag2_0/intent_recognition/PromptTemplates.py +++ b/rag2_0/intent_recognition/PromptTemplates.py @@ -15,8 +15,9 @@ extract_nouns_prompt=""" - 软件相关:功能模块/操作步骤/报错提示/扩展名后缀名 - 造价专业:费用类型/计算标准/行业规范 - 电力工程:项目类型/设备型号/工程阶段 -3. 自动展开缩写(如将'导excel'转为'Excel导入') +3. 自动展开缩写(如将'导excel'转为'导入Excel') 4. 严格基于用户问题提取关键词,不要输出与用户问题无关的关键词 +5. 不要擅自揣摩、猜测、推断关键词,不要修改关键的信息(如:粘贴excel->导入excel) 三、输出格式: {output_format}