IsmaeelPandey committed on
Commit
d2a7723
·
1 Parent(s): 7cd66f5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -3
app.py CHANGED
@@ -25,14 +25,22 @@ os.environ["HUGGINGFACEHUB_API_TOKEN"] = "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"
25
  embedding = HuggingFaceHubEmbeddings()
26
 
27
  loader = PyPDFLoader("1.pdf")
28
- pages = loader.load_and_split()
 
 
 
 
 
 
 
 
 
 
29
 
30
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
31
  docs = text_splitter.split_documents(pages)
32
 
33
- loader2 = PyPDFLoader("2.pdf")
34
  pages2 = loader2.load_and_split()
35
- docs.append(text_splitter.split_documents(pages2))
36
 
37
  vectorstore = Chroma.from_documents(documents=docs, embedding=embedding)
38
 
 
25
  embedding = HuggingFaceHubEmbeddings()
26
 
27
  loader = PyPDFLoader("1.pdf")
28
+ loader2 = PyPDFLoader("2.pdf")
29
+ loaders = []
30
+
31
+ loaders.append(loader)
32
+ loaders.append(loader2)
33
+
34
+ loaderdocs = []
35
+ for l in loaders:
36
+ loaderdocs.extend(l.load_and_split())
37
+ text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
38
+ docs = text_splitter.split_documents(loaderdocs)
39
 
40
  text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
41
  docs = text_splitter.split_documents(pages)
42
 
 
43
  pages2 = loader2.load_and_split()
 
44
 
45
  vectorstore = Chroma.from_documents(documents=docs, embedding=embedding)
46