Spaces:
Sleeping
Sleeping
Commit ·
6426c42
1
Parent(s): a7fc579
try 9
Browse files
- app/core/processor.py +2 -1
app/core/processor.py
CHANGED
|
@@ -2,6 +2,7 @@ from langchain_community.document_loaders import (
|
|
| 2 |
UnstructuredWordDocumentLoader,
|
| 3 |
TextLoader,
|
| 4 |
CSVLoader,
|
|
|
|
| 5 |
UnstructuredMarkdownLoader,
|
| 6 |
)
|
| 7 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
|
@@ -107,7 +108,7 @@ class DocumentProcessor:
|
|
| 107 |
loader = None
|
| 108 |
parallelization = False
|
| 109 |
if filepath.endswith(".pdf"):
|
| 110 |
-
loader =
|
| 111 |
file_path=filepath
|
| 112 |
) # splits each presentation into slides and processes it as separate file
|
| 113 |
parallelization = False
|
|
|
|
| 2 |
UnstructuredWordDocumentLoader,
|
| 3 |
TextLoader,
|
| 4 |
CSVLoader,
|
| 5 |
+
PyPDFLoader,
|
| 6 |
UnstructuredMarkdownLoader,
|
| 7 |
)
|
| 8 |
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
|
|
|
| 108 |
loader = None
|
| 109 |
parallelization = False
|
| 110 |
if filepath.endswith(".pdf"):
|
| 111 |
+
loader = PyPDFLoader(
|
| 112 |
file_path=filepath
|
| 113 |
) # splits each presentation into slides and processes it as separate file
|
| 114 |
parallelization = False
|