Spaces:
Paused
Paused
Mikiko Bazeley committed on
Commit ·
a23f69d
1
Parent(s): 83b451a
fixed docloader
Browse files
app.py
CHANGED
|
@@ -46,9 +46,9 @@ HF_TOKEN = os.environ["HF_TOKEN"]
|
|
| 46 |
### NOTE: PAY ATTENTION TO THE PATH THEY ARE IN.
|
| 47 |
|
| 48 |
# Mikiko: Leveraging PyMUPDFLoader to load PDF - from Assignment 6
|
| 49 |
-
|
| 50 |
# document_loader = TextLoader("./data/paul_graham_essays.txt")
|
| 51 |
-
documents = document_loader.load()
|
| 52 |
|
| 53 |
### 2. CREATE TEXT SPLITTER AND SPLIT DOCUMENTS
|
| 54 |
# text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=30)
|
|
|
|
| 46 |
### NOTE: PAY ATTENTION TO THE PATH THEY ARE IN.
|
| 47 |
|
| 48 |
# Mikiko: Leveraging PyMUPDFLoader to load PDF - from Assignment 6
|
| 49 |
+
documents = PyMuPDFLoader("./data/airbnb10k.pdf").load()
|
| 50 |
# document_loader = TextLoader("./data/paul_graham_essays.txt")
|
| 51 |
+
# documents = document_loader.load()
|
| 52 |
|
| 53 |
### 2. CREATE TEXT SPLITTER AND SPLIT DOCUMENTS
|
| 54 |
# text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=30)
|