Update app.py
Browse files
app.py
CHANGED
|
@@ -65,14 +65,12 @@ YOUTUBE_DIR = "/youtube"
|
|
| 65 |
|
| 66 |
###############################################
|
| 67 |
#URLs zu Dokumenten oder andere Inhalte, die einbezogen werden sollen
|
| 68 |
-
|
| 69 |
WEB_URL = "https://openai.com/research/gpt-4"
|
| 70 |
YOUTUBE_URL_1 = "https://www.youtube.com/watch?v=--khbXchTeE"
|
| 71 |
YOUTUBE_URL_2 = "https://www.youtube.com/watch?v=hdhZwyf24mE"
|
| 72 |
#YOUTUBE_URL_3 = "https://www.youtube.com/watch?v=vw-KWfKwvTQ"
|
| 73 |
|
| 74 |
-
#URL zu PDF dokumenten, die online verfügbar sind...
|
| 75 |
-
PDF_URL = "..."
|
| 76 |
|
| 77 |
|
| 78 |
################################################
|
|
@@ -142,11 +140,11 @@ def document_loading_splitting():
|
|
| 142 |
|
| 143 |
#andere loader...
|
| 144 |
# Load PDF
|
| 145 |
-
|
| 146 |
-
|
| 147 |
# Load Web
|
| 148 |
-
|
| 149 |
-
|
| 150 |
# Load YouTube
|
| 151 |
#loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,YOUTUBE_URL_2], PATH_WORK + YOUTUBE_DIR), OpenAIWhisperParser())
|
| 152 |
#docs.extend(loader.load())
|
|
|
|
| 65 |
|
| 66 |
###############################################
|
| 67 |
#URLs zu Dokumenten oder andere Inhalte, die einbezogen werden sollen
|
| 68 |
+
PDF_URL = "https://arxiv.org/pdf/2303.08774.pdf"
|
| 69 |
WEB_URL = "https://openai.com/research/gpt-4"
|
| 70 |
YOUTUBE_URL_1 = "https://www.youtube.com/watch?v=--khbXchTeE"
|
| 71 |
YOUTUBE_URL_2 = "https://www.youtube.com/watch?v=hdhZwyf24mE"
|
| 72 |
#YOUTUBE_URL_3 = "https://www.youtube.com/watch?v=vw-KWfKwvTQ"
|
| 73 |
|
|
|
|
|
|
|
| 74 |
|
| 75 |
|
| 76 |
################################################
|
|
|
|
| 140 |
|
| 141 |
#andere loader...
|
| 142 |
# Load PDF
|
| 143 |
+
loader = PyPDFLoader(PDF_URL)  # use the PDF_URL constant from the URL section; PDF_URL1 is not defined in the visible file
|
| 144 |
+
docs.extend(loader.load())
|
| 145 |
# Load Web
|
| 146 |
+
loader = WebBaseLoader(WEB_URL)
|
| 147 |
+
docs.extend(loader.load())
|
| 148 |
# Load YouTube
|
| 149 |
#loader = GenericLoader(YoutubeAudioLoader([YOUTUBE_URL_1,YOUTUBE_URL_2], PATH_WORK + YOUTUBE_DIR), OpenAIWhisperParser())
|
| 150 |
#docs.extend(loader.load())
|