Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -15,6 +15,7 @@ from aimakerspace.vectordatabase import VectorDatabase
|
|
| 15 |
from aimakerspace.openai_utils.chatmodel import ChatOpenAI
|
| 16 |
import chainlit as cl
|
| 17 |
from langchain_community.document_loaders import PyPDFLoader
|
|
|
|
| 18 |
|
| 19 |
system_template = """\
|
| 20 |
Use the following context to answer a users question. If you cannot find the answer in the context, say you don't know the answer."""
|
|
@@ -58,7 +59,10 @@ class RetrievalAugmentedQAPipeline:
|
|
| 58 |
|
| 59 |
|
| 60 |
text_splitter = CharacterTextSplitter()
|
| 61 |
-
|
|
|
|
|
|
|
|
|
|
| 62 |
|
| 63 |
def process_text_file(file: AskFileResponse):
|
| 64 |
import tempfile
|
|
@@ -90,7 +94,7 @@ def process_pdf_file(file: AskFileResponse):
|
|
| 90 |
|
| 91 |
pdf_loader = PyPDFLoader(temp_file_path)
|
| 92 |
documents = pdf_loader.load()
|
| 93 |
-
texts =
|
| 94 |
return texts
|
| 95 |
|
| 96 |
|
|
|
|
| 15 |
from aimakerspace.openai_utils.chatmodel import ChatOpenAI
|
| 16 |
import chainlit as cl
|
| 17 |
from langchain_community.document_loaders import PyPDFLoader
|
| 18 |
+
from langchain_text_splitters import RecursiveCharacterTextSplitter
|
| 19 |
|
| 20 |
system_template = """\
|
| 21 |
Use the following context to answer a users question. If you cannot find the answer in the context, say you don't know the answer."""
|
|
|
|
| 59 |
|
| 60 |
|
| 61 |
text_splitter = CharacterTextSplitter()
|
| 62 |
+
pdf_text_splitter = RecursiveCharacterTextSplitter(
|
| 63 |
+
chunk_size=1000,
|
| 64 |
+
chunk_overlap=200,
|
| 65 |
+
)
|
| 66 |
|
| 67 |
def process_text_file(file: AskFileResponse):
|
| 68 |
import tempfile
|
|
|
|
| 94 |
|
| 95 |
pdf_loader = PyPDFLoader(temp_file_path)
|
| 96 |
documents = pdf_loader.load()
|
| 97 |
+
texts = pdf_text_splitter.split_texts(documents)
|
| 98 |
return texts
|
| 99 |
|
| 100 |
|