Ilyas KHIAT
committed on
Commit
·
3bd3ddd
1
Parent(s):
6f0715e
modif
Browse files
- .streamlit/config.toml +2 -0
- RAG_PDF_WEB.py +2 -2
.streamlit/config.toml
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[server]
|
| 2 |
+
maxUploadSize = 200
|
RAG_PDF_WEB.py
CHANGED
|
@@ -28,8 +28,8 @@ def get_pdf_text(pdf_docs):
|
|
| 28 |
def get_text_chunks(text):
|
| 29 |
text_splitter = CharacterTextSplitter(
|
| 30 |
separator="\n",
|
| 31 |
-
chunk_size=
|
| 32 |
-
chunk_overlap=
|
| 33 |
length_function=len # the length function - in this case, character length (aka the python len() fn.)
|
| 34 |
)
|
| 35 |
chunks = text_splitter.split_text(text)
|
|
|
|
| 28 |
def get_text_chunks(text):
|
| 29 |
text_splitter = CharacterTextSplitter(
|
| 30 |
separator="\n",
|
| 31 |
+
chunk_size=1000, # the character length of the chunck
|
| 32 |
+
chunk_overlap=200, # the character length of the overlap between chuncks
|
| 33 |
length_function=len # the length function - in this case, character length (aka the python len() fn.)
|
| 34 |
)
|
| 35 |
chunks = text_splitter.split_text(text)
|