diff --git a/api/db/services/dialog_service.py b/api/db/services/dialog_service.py index e56b131..a5d15c3 100644 --- a/api/db/services/dialog_service.py +++ b/api/db/services/dialog_service.py @@ -495,8 +495,10 @@ def ask(question, kb_ids, tenant_id): max_tokens = chat_mdl.max_length # 获取所有知识库的租户ID并去重 tenant_ids = list(set([kb.tenant_id for kb in kbs])) + # 设置更小的相似度阈值以适配更好的效果(原始值0.1) + similarity_threshold = 0.01 # 调用检索器检索相关文档片段 - kbinfos = retriever.retrieval(question, embd_mdl, tenant_ids, kb_ids, 1, 12, 0.1, 0.3, aggs=False, rank_feature=label_question(question, kbs)) + kbinfos = retriever.retrieval(question, embd_mdl, tenant_ids, kb_ids, 1, 12, similarity_threshold, 0.3, aggs=False, rank_feature=label_question(question, kbs)) # 将检索结果格式化为提示词,并确保不超过模型最大token限制 knowledges = kb_prompt(kbinfos, max_tokens) prompt = """ diff --git a/docker/docker-compose.yml b/docker/docker-compose.yml index ee9aec8..11dd245 100644 --- a/docker/docker-compose.yml +++ b/docker/docker-compose.yml @@ -18,6 +18,7 @@ services: - ./nginx/proxy.conf:/etc/nginx/proxy.conf - ./nginx/nginx.conf:/etc/nginx/nginx.conf - ../api/db/services/database.py:/ragflow/api/db/services/database.py + - ../api/db/services/dialog_service.py:/ragflow/api/db/services/dialog_service.py env_file: .env environment: - TZ=${TIMEZONE} diff --git a/docker/docker-compose_gpu.yml b/docker/docker-compose_gpu.yml index 9dcd6bd..a1c0ed4 100644 --- a/docker/docker-compose_gpu.yml +++ b/docker/docker-compose_gpu.yml @@ -18,6 +18,7 @@ services: - ./nginx/proxy.conf:/etc/nginx/proxy.conf - ./nginx/nginx.conf:/etc/nginx/nginx.conf - ../api/db/services/database.py:/ragflow/api/db/services/database.py + - ../api/db/services/dialog_service.py:/ragflow/api/db/services/dialog_service.py env_file: .env environment: - TZ=${TIMEZONE}