amalsp committed on
Commit
1011c08
·
verified ·
1 Parent(s): d11d1d2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -2
app.py CHANGED
@@ -3,7 +3,7 @@ import bs4
3
  from langchain.text_splitter import RecursiveCharacterTextSplitter
4
  from langchain_community.document_loaders import WebBaseLoader
5
  from langchain_community.vectorstores import Chroma
6
- from langchain_community.embeddings import HuggingFaceHubEmbeddings # Updated import
7
  from dotenv import load_dotenv
8
  import os
9
 
@@ -47,7 +47,10 @@ def load_and_retrieve_docs(url, max_retries=3):
47
  docs = loader.load()
48
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
49
  splits = text_splitter.split_documents(docs)
50
- embeddings = HuggingFaceHubEmbeddings(model_name="sentence-transformers/all-mpnet-base-v2") # Updated embeddings
 
 
 
51
  vectorstore = Chroma.from_documents(documents=splits, embedding=embeddings)
52
  return vectorstore.as_retriever()
53
  except ReadTimeout:
 
3
  from langchain.text_splitter import RecursiveCharacterTextSplitter
4
  from langchain_community.document_loaders import WebBaseLoader
5
  from langchain_community.vectorstores import Chroma
6
+ from langchain_huggingface import HuggingFaceEndpointEmbeddings # Updated import
7
  from dotenv import load_dotenv
8
  import os
9
 
 
47
  docs = loader.load()
48
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200)
49
  splits = text_splitter.split_documents(docs)
50
+ embeddings = HuggingFaceEndpointEmbeddings(
51
+ endpoint_url="https://api-inference.huggingface.co/models/sentence-transformers/all-mpnet-base-v2",
52
+ api_key=os.environ["HUGGINGFACE_API_KEY"]
53
+ ) # Updated embeddings
54
  vectorstore = Chroma.from_documents(documents=splits, embedding=embeddings)
55
  return vectorstore.as_retriever()
56
  except ReadTimeout: