Update utils.py
Browse files
utils.py
CHANGED
|
@@ -214,14 +214,14 @@ def document_loading_splitting():
|
|
| 214 |
|
| 215 |
#andere loader...
|
| 216 |
# Load PDF
|
| 217 |
-
loader = PyPDFLoader(PDF_URL)
|
| 218 |
-
docs.extend(loader.load())
|
| 219 |
# Load Web
|
| 220 |
-
loader = WebBaseLoader(WEB_URL)
|
| 221 |
-
docs.extend(loader.load())
|
| 222 |
# Load YouTube
|
| 223 |
-
loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,YOUTUBE_URL_2], PATH_WORK + YOUTUBE_DIR), OpenAIWhisperParser())
|
| 224 |
-
docs.extend(loader.load())
|
| 225 |
################################
|
| 226 |
# Document splitting
|
| 227 |
text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150, chunk_size = 1500)
|
|
|
|
| 214 |
|
| 215 |
#andere loader...
|
| 216 |
# Load PDF
|
| 217 |
+
#loader = PyPDFLoader(PDF_URL)
|
| 218 |
+
#docs.extend(loader.load())
|
| 219 |
# Load Web
|
| 220 |
+
#loader = WebBaseLoader(WEB_URL)
|
| 221 |
+
#docs.extend(loader.load())
|
| 222 |
# Load YouTube
|
| 223 |
+
#loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,YOUTUBE_URL_2], PATH_WORK + YOUTUBE_DIR), OpenAIWhisperParser())
|
| 224 |
+
#docs.extend(loader.load())
|
| 225 |
################################
|
| 226 |
# Document splitting
|
| 227 |
text_splitter = RecursiveCharacterTextSplitter(chunk_overlap = 150, chunk_size = 1500)
|