ancirius committed on
Commit
9ecde64
·
verified ·
1 Parent(s): ff9eabf

Update retriever.py

Browse files
Files changed (1) hide show
  1. retriever.py +18 -0
retriever.py CHANGED
@@ -1,6 +1,24 @@
1
  from langchain_community.retrievers import BM25Retriever
2
  from langchain.tools import Tool
 
 
3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  bm25_retriever = BM25Retriever.from_documents(docs)
5
 
6
  def extract_text(query: str) -> str:
 
1
  from langchain_community.retrievers import BM25Retriever
2
  from langchain.tools import Tool
3
+ import datasets
4
+ from langchain.docstore.document import Document
5
 
6
+ # Load the dataset
7
+ guest_dataset = datasets.load_dataset("agents-course/unit3-invitees", split="train")
8
+
9
+ # Convert dataset entries into Document objects
10
+ docs = [
11
+ Document(
12
+ page_content="\n".join([
13
+ f"Name: {guest['name']}",
14
+ f"Relation: {guest['relation']}",
15
+ f"Description: {guest['description']}",
16
+ f"Email: {guest['email']}"
17
+ ]),
18
+ metadata={"name": guest["name"]}
19
+ )
20
+ for guest in guest_dataset
21
+ ]
22
  bm25_retriever = BM25Retriever.from_documents(docs)
23
 
24
  def extract_text(query: str) -> str: