Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -16,10 +16,13 @@ from langchain.embeddings.sentence_transformer import SentenceTransformerEmbeddi
|
|
| 16 |
|
| 17 |
def get_pdf_text(pdf_docs):
|
| 18 |
text = ""
|
| 19 |
-
|
| 20 |
-
|
| 21 |
-
|
| 22 |
-
|
|
|
|
|
|
|
|
|
|
| 23 |
return text
|
| 24 |
|
| 25 |
|
|
|
|
| 16 |
|
| 17 |
def get_pdf_text(pdf_docs):
    """Extract and concatenate the text of every page of every PDF given.

    Args:
        pdf_docs: Iterable of PDF sources. Each item is either a value that
            ``fitz.open`` accepts as a filename, or a file-like object
            exposing ``read()`` (presumably the app's uploaded files --
            TODO confirm against the caller). ``None`` or an empty iterable
            yields an empty string.

    Returns:
        The text of all pages, in document order then page order, joined
        into a single ``str``.
    """
    page_texts = []
    for pdf in pdf_docs or ():
        if hasattr(pdf, "read"):
            # In-memory source: hand PyMuPDF the raw bytes and name the
            # format explicitly, since there is no file extension to go on.
            document = fitz.open(stream=pdf.read(), filetype="pdf")
        else:
            document = fitz.open(pdf)
        # The context manager closes the document even if a page fails.
        with document:
            page_texts.extend(page.get_text() for page in document)
    return "".join(page_texts)
|
| 27 |
|
| 28 |
|