JARVISXIRONMAN commited on
Commit
bab38b6
·
verified ·
1 Parent(s): bcbf03f

Create retriever.py

Browse files
Files changed (1) hide show
  1. utils/retriever.py +18 -7
utils/retriever.py CHANGED
@@ -1,10 +1,21 @@
1
- # utils/retriever.py
2
-
3
  import os
4
- from langchain.vectorstores import Chroma
5
- from langchain.embeddings import HuggingFaceEmbeddings
 
 
 
 
 
 
6
 
7
- def load_vectorstore(folder_path="data/vectorstore"):
8
  embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
9
- vectordb = Chroma(persist_directory=folder_path, embedding_function=embeddings)
10
- return vectordb
 
 
 
 
 
 
 
 
 
 
1
  import os
2
+ from langchain_community.vectorstores import Chroma
3
+ from langchain_community.embeddings import HuggingFaceEmbeddings
4
+ from langchain_core.vectorstores import VectorStoreRetriever
5
+
6
+ def load_vectorstore(pdf_path: str) -> VectorStoreRetriever:
7
+ # Ensure Chroma store directory exists
8
+ folder_path = "chroma_store"
9
+ os.makedirs(folder_path, exist_ok=True)
10
 
11
+ # Use a local embedding model (no API key needed)
12
  embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
13
+
14
+ # Initialize Chroma without deprecated Settings
15
+ vectordb = Chroma(
16
+ persist_directory=folder_path,
17
+ embedding_function=embeddings
18
+ )
19
+
20
+ # Return retriever
21
+ return vectordb.as_retriever()