MrSimple07 committed on
Commit
8d71306
·
1 Parent(s): 29f19c8

bm25 full corpus + COMPACT + NodePostprocessor

Browse files
Files changed (1) hide show
  1. index_retriever.py +9 -6
index_retriever.py CHANGED
@@ -14,33 +14,36 @@ def create_vector_index(documents):
14
 
15
  def create_query_engine(vector_index):
16
  try:
 
 
 
17
  bm25_retriever = BM25Retriever.from_defaults(
18
  docstore=vector_index.docstore,
19
- nodes=vector_index.get_nodes(), # <-- add this line
20
- similarity_top_k=20
21
  )
22
 
23
  vector_retriever = VectorIndexRetriever(
24
  index=vector_index,
25
  similarity_top_k=30,
26
- similarity_cutoff=0.7
27
  )
28
 
29
  hybrid_retriever = QueryFusionRetriever(
30
  [vector_retriever, bm25_retriever],
31
  similarity_top_k=40,
32
- num_queries=1
33
  )
34
 
35
  custom_prompt_template = PromptTemplate(PROMPT_SIMPLE_POISK)
36
  response_synthesizer = get_response_synthesizer(
37
  response_mode=ResponseMode.COMPACT,
38
- text_qa_template=custom_prompt_template
39
  )
40
 
41
  query_engine = RetrieverQueryEngine(
42
  retriever=hybrid_retriever,
43
- response_synthesizer=response_synthesizer
44
  )
45
 
46
  log_message("Query engine успешно создан")
 
14
 
15
  def create_query_engine(vector_index):
16
  try:
17
+ # ✅ Get all nodes from docstore instead of vector_index.get_nodes()
18
+ all_nodes = list(vector_index.docstore.get_all_nodes().values())
19
+
20
  bm25_retriever = BM25Retriever.from_defaults(
21
  docstore=vector_index.docstore,
22
+ nodes=all_nodes,
23
+ similarity_top_k=20,
24
  )
25
 
26
  vector_retriever = VectorIndexRetriever(
27
  index=vector_index,
28
  similarity_top_k=30,
29
+ similarity_cutoff=0.7,
30
  )
31
 
32
  hybrid_retriever = QueryFusionRetriever(
33
  [vector_retriever, bm25_retriever],
34
  similarity_top_k=40,
35
+ num_queries=1,
36
  )
37
 
38
  custom_prompt_template = PromptTemplate(PROMPT_SIMPLE_POISK)
39
  response_synthesizer = get_response_synthesizer(
40
  response_mode=ResponseMode.COMPACT,
41
+ text_qa_template=custom_prompt_template,
42
  )
43
 
44
  query_engine = RetrieverQueryEngine(
45
  retriever=hybrid_retriever,
46
+ response_synthesizer=response_synthesizer,
47
  )
48
 
49
  log_message("Query engine успешно создан")