Spaces:
Sleeping
Sleeping
Commit
·
5bdb023
1
Parent(s):
3db8611
Update app.py
Browse files
app.py
CHANGED
|
@@ -24,6 +24,13 @@ from langchain.document_loaders import PyPDFDirectoryLoader
|
|
| 24 |
os.environ["HUGGINGFACEHUB_API_TOKEN"] = "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"
|
| 25 |
embedding = HuggingFaceHubEmbeddings()
|
| 26 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 27 |
loader = PyPDFLoader("1.pdf")
|
| 28 |
loader2 = PyPDFLoader("2.pdf")
|
| 29 |
loaders = []
|
|
@@ -31,7 +38,6 @@ loaders = []
|
|
| 31 |
loaders.append(loader)
|
| 32 |
loaders.append(loader2)
|
| 33 |
|
| 34 |
-
loaderdocs = []
|
| 35 |
for l in loaders:
|
| 36 |
loaderdocs.extend(l.load_and_split())
|
| 37 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
|
|
|
|
| 24 |
os.environ["HUGGINGFACEHUB_API_TOKEN"] = "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"
|
| 25 |
embedding = HuggingFaceHubEmbeddings()
|
| 26 |
|
| 27 |
+
loaderdocs = []
|
| 28 |
+
|
| 29 |
+
url = "https://nanoreview.net/en/phone-compare/samsung-galaxy-s9-vs-samsung-galaxy-s10"
|
| 30 |
+
loader3 = RecursiveUrlLoader(url=url, max_depth=1)
|
| 31 |
+
|
| 32 |
+
loaderdocs.extend(loader3.load())
|
| 33 |
+
|
| 34 |
loader = PyPDFLoader("1.pdf")
|
| 35 |
loader2 = PyPDFLoader("2.pdf")
|
| 36 |
loaders = []
|
|
|
|
| 38 |
loaders.append(loader)
|
| 39 |
loaders.append(loader2)
|
| 40 |
|
|
|
|
| 41 |
for l in loaders:
|
| 42 |
loaderdocs.extend(l.load_and_split())
|
| 43 |
text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=0)
|