minh-4T committed on
Commit
01728f2
·
verified ·
1 Parent(s): 1cd07dd

update BM25

Browse files
Files changed (1) hide show
  1. core/retriever.py +1 -1
core/retriever.py CHANGED
@@ -8,7 +8,7 @@ class HybridRetriever:
8
  self.documents = documents
9
  print(" Đang khởi tạo BM25...")
10
  tokenized_docs = [doc.page_content.lower().split() for doc in documents]
11
- self.bm25 = BM25Okapi(tokenized_docs)
12
  print(" BM25 sẵn sàng!")
13
 
14
  def search(self, query: str, k: int = 10, alpha: float = 0.6) -> List:
 
8
  self.documents = documents
9
  print(" Đang khởi tạo BM25...")
10
  tokenized_docs = [doc.page_content.lower().split() for doc in documents]
11
+ self.bm25 = BM25Okapi(tokenized_docs,k1=1.5, b=0.5)
12
  print(" BM25 sẵn sàng!")
13
 
14
  def search(self, query: str, k: int = 10, alpha: float = 0.6) -> List: