Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -5,7 +5,7 @@ import logging
|
|
| 5 |
import io
|
| 6 |
import requests
|
| 7 |
from bs4 import BeautifulSoup
|
| 8 |
-
from PyPDF2 import PdfReader
|
| 9 |
import pdfplumber
|
| 10 |
import docx
|
| 11 |
from langchain.text_splitter import CharacterTextSplitter
|
|
@@ -110,10 +110,6 @@ def main():
|
|
| 110 |
for link in pdf_links:
|
| 111 |
text += fetch_and_process_pdf(link)
|
| 112 |
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
#text = read_documents_from_directory(train_directory)
|
| 116 |
-
|
| 117 |
# Processing text and setting up the AI model
|
| 118 |
char_text_splitter = CharacterTextSplitter(separator="\n", chunk_size=1000,
|
| 119 |
chunk_overlap=200, length_function=len)
|
|
|
|
| 5 |
import io
|
| 6 |
import requests
|
| 7 |
from bs4 import BeautifulSoup
|
| 8 |
+
#from PyPDF2 import PdfReader
|
| 9 |
import pdfplumber
|
| 10 |
import docx
|
| 11 |
from langchain.text_splitter import CharacterTextSplitter
|
|
|
|
| 110 |
for link in pdf_links:
|
| 111 |
text += fetch_and_process_pdf(link)
|
| 112 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 113 |
# Processing text and setting up the AI model
|
| 114 |
char_text_splitter = CharacterTextSplitter(separator="\n", chunk_size=1000,
|
| 115 |
chunk_overlap=200, length_function=len)
|