Samyurta committed on
Commit
73a7009
·
1 Parent(s): 77cf134

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -4
app.py CHANGED
@@ -16,10 +16,13 @@ from langchain.embeddings.sentence_transformer import SentenceTransformerEmbeddi
16
 
17
  def get_pdf_text(pdf_docs):
18
  text = ""
19
- for pdf in pdf_docs:
20
- pdf_reader = PdfReader(pdf)
21
- for page in pdf_reader.pages:
22
- text += page.extract_text()
 
 
 
23
  return text
24
 
25
 
 
16
 
17
  def get_pdf_text(pdf_docs):
18
  text = ""
19
+ pdf_document = fitz.open(pdf_path)
20
+
21
+ for page_number in range(pdf_document.page_count):
22
+ page = pdf_document[page_number]
23
+ text += page.get_text()
24
+
25
+ pdf_document.close()
26
  return text
27
 
28