Spaces:

QuaidKhalid
/

PDFChatBot

Sleeping

QuaidKhalid committed on Aug 31, 2024

Commit

aa1686a

verified ·

1 Parent(s): 99c3c54

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,6 +7,8 @@ from langchain_core.runnables import RunnablePassthrough
 from langchain_text_splitters import RecursiveCharacterTextSplitter
 from sentence_transformers import SentenceTransformer
 import torch
 # Define the embedding class
@@ -35,11 +37,15 @@ langchain_api_key = "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"
 def load_document(document_path):
     try:
-        loader = PyPDFLoader(document_path)
-        docs = loader.load()
-        text_splitter = RecursiveCharacterTextSplitter(chunk_size=4000, chunk_overlap=200)
-        splits = text_splitter.split_documents(docs)
-        return splits
     except Exception as e:
         return str(e)
@@ -85,4 +91,6 @@ if document_path is not None and query:
             result = answer_question(rag_chain, query)
             st.write("Result:", result)
 st.write("Note: Replace `llm` with an appropriate language model.")

 from langchain_text_splitters import RecursiveCharacterTextSplitter
 from sentence_transformers import SentenceTransformer
 import torch
+import os
+import tempfile
 # Define the embedding class
 def load_document(document_path):
     try:
+        with tempfile.TemporaryDirectory() as tmp_dir:
+            tmp_file = os.path.join(tmp_dir, 'temp.pdf')
+            with open(tmp_file, 'wb') as f:
+                f.write(document_path.getvalue())
+            loader = PyPDFLoader(tmp_file)
+            docs = loader.load()
+            text_splitter = RecursiveCharacterTextSplitter(chunk_size=4000, chunk_overlap=200)
+            splits = text_splitter.split_documents(docs)
+            return splits
     except Exception as e:
         return str(e)
             result = answer_question(rag_chain, query)
             st.write("Result:", result)
 st.write("Note: Replace `llm` with an appropriate language model.")