Spaces:
Paused
Paused
lanny xu committed on
Commit ·
450704e
1
Parent(s): 4f5443a
resolve conflict
Browse files
- document_processor.py +5 -5
- workflow_nodes.py +2 -2
document_processor.py
CHANGED
|
@@ -139,15 +139,15 @@ class DocumentProcessor:
|
|
| 139 |
print("⚠️ 检索器未初始化")
|
| 140 |
return []
|
| 141 |
|
| 142 |
-
# 1. 初始检索:获取更多候选文档
|
| 143 |
-
initial_docs = self.retriever.get_relevant_documents(query)
|
| 144 |
|
| 145 |
# 获取更多候选(如果可能)
|
| 146 |
if hasattr(self.retriever, 'search_kwargs'):
|
| 147 |
# 修改检索参数以获取更多结果
|
| 148 |
original_k = self.retriever.search_kwargs.get('k', 4)
|
| 149 |
self.retriever.search_kwargs['k'] = min(rerank_candidates, len(initial_docs))
|
| 150 |
-
candidate_docs = self.retriever.get_relevant_documents(query)
|
| 151 |
self.retriever.search_kwargs['k'] = original_k # 恢复原设置
|
| 152 |
else:
|
| 153 |
candidate_docs = initial_docs
|
|
@@ -177,8 +177,8 @@ class DocumentProcessor:
|
|
| 177 |
if not self.retriever:
|
| 178 |
return {}
|
| 179 |
|
| 180 |
-
# 原始检索
|
| 181 |
-
original_docs = self.retriever.get_relevant_documents(query)[:top_k]
|
| 182 |
|
| 183 |
# 增强检索(带重排)
|
| 184 |
enhanced_docs = self.enhanced_retrieve(query, top_k)
|
|
|
|
| 139 |
print("⚠️ 检索器未初始化")
|
| 140 |
return []
|
| 141 |
|
| 142 |
+
# 1. 初始检索:获取更多候选文档 (使用 invoke 替代 get_relevant_documents)
|
| 143 |
+
initial_docs = self.retriever.invoke(query)
|
| 144 |
|
| 145 |
# 获取更多候选(如果可能)
|
| 146 |
if hasattr(self.retriever, 'search_kwargs'):
|
| 147 |
# 修改检索参数以获取更多结果
|
| 148 |
original_k = self.retriever.search_kwargs.get('k', 4)
|
| 149 |
self.retriever.search_kwargs['k'] = min(rerank_candidates, len(initial_docs))
|
| 150 |
+
candidate_docs = self.retriever.invoke(query)
|
| 151 |
self.retriever.search_kwargs['k'] = original_k # 恢复原设置
|
| 152 |
else:
|
| 153 |
candidate_docs = initial_docs
|
|
|
|
| 177 |
if not self.retriever:
|
| 178 |
return {}
|
| 179 |
|
| 180 |
+
# 原始检索 (使用 invoke 替代 get_relevant_documents)
|
| 181 |
+
original_docs = self.retriever.invoke(query)[:top_k]
|
| 182 |
|
| 183 |
# 增强检索(带重排)
|
| 184 |
enhanced_docs = self.enhanced_retrieve(query, top_k)
|
workflow_nodes.py
CHANGED
|
@@ -73,8 +73,8 @@ class WorkflowNodes:
|
|
| 73 |
print("---检索---")
|
| 74 |
question = state["question"]
|
| 75 |
|
| 76 |
-
# 检索
|
| 77 |
-
documents = self.retriever.get_relevant_documents(question)
|
| 78 |
return {"documents": documents, "question": question}
|
| 79 |
|
| 80 |
def generate(self, state):
|
|
|
|
| 73 |
print("---检索---")
|
| 74 |
question = state["question"]
|
| 75 |
|
| 76 |
+
# 检索 (使用 invoke 替代 get_relevant_documents)
|
| 77 |
+
documents = self.retriever.invoke(question)
|
| 78 |
return {"documents": documents, "question": question}
|
| 79 |
|
| 80 |
def generate(self, state):
|