Spaces:

nikhmr1235
/

PDF_document_chatbot

Sleeping

App Files Files Community

nikhmr1235 committed on Aug 29, 2025

Commit

bc68e2a

verified ·

1 Parent(s): 0215574

Attempt to fix KeyError: 7 for the global `state` object

Browse files

Files changed (1) hide show

app.py +8 -14

app.py CHANGED Viewed

@@ -59,21 +59,15 @@ def process_pdf(pdf_file, state):
                 state
             )
-        # Remove the old temporary directory if it exists
-        if os.path.exists(state.vector_store_path):
-            shutil.rmtree(state.vector_store_path)
-            state.db = None  # Reset the database state
-        # Create a new session and directory for the user
-        state.session_id = str(uuid.uuid4())
-        state.vector_store_path = os.path.join(CHROMA_DB_PATH, state.session_id)
-        os.makedirs(state.vector_store_path)
         # Extract text from the PDF using PyMuPDF (fitz)
         doc = fitz.open(pdf_file.name)
         text = ""
         for page in doc:
-            text += page.get_text()
         doc.close()
         # Split text into chunks
@@ -82,10 +76,10 @@ def process_pdf(pdf_file, state):
         # Create a ChromaDB vector store from the documents
         embeddings = GoogleGenerativeAIEmbeddings(model=EMBEDDING_MODEL)
-        state.db = Chroma.from_documents(
             documents=docs,
             embedding=embeddings,
-            persist_directory=state.vector_store_path
         )
         gr.Info("PDF processed successfully! You can now ask questions about the document.")
@@ -94,11 +88,11 @@ def process_pdf(pdf_file, state):
         return (
             gr.update(interactive=False),
             gr.update(visible=True),
-            state
         )
     except Exception as e:
         # Clean up the directory in case of an error
-        if os.path.exists(state.vector_store_path):
             shutil.rmtree(state.vector_store_path)
         gr.Error(f"An error occurred: {str(e)}")
         # Re-enable the file upload in case of error

                 state
             )
+        # If a file is uploaded, a new session should be started
+        # The new session object is returned to update the state
+        new_state = new_session()
         # Extract text from the PDF using PyMuPDF (fitz)
         doc = fitz.open(pdf_file.name)
         text = ""
         for page in doc:
+            text += doc.get_text()
         doc.close()
         # Split text into chunks
         # Create a ChromaDB vector store from the documents
         embeddings = GoogleGenerativeAIEmbeddings(model=EMBEDDING_MODEL)
+        new_state.db = Chroma.from_documents(
             documents=docs,
             embedding=embeddings,
+            persist_directory=new_state.vector_store_path
         )
         gr.Info("PDF processed successfully! You can now ask questions about the document.")
         return (
             gr.update(interactive=False),
             gr.update(visible=True),
+            new_state
         )
     except Exception as e:
         # Clean up the directory in case of an error
+        if state and os.path.exists(state.vector_store_path):
             shutil.rmtree(state.vector_store_path)
         gr.Error(f"An error occurred: {str(e)}")
         # Re-enable the file upload in case of error