Spaces:

TKM03
/

PDF_based_chatbot

Build error

App Files Files Community

TKM03 committed on Feb 18, 2025

Commit

dfc5079

verified ·

1 Parent(s): 3991753

version7

Browse files

Files changed (1) hide show

app.py +2 -26

app.py CHANGED Viewed

@@ -16,21 +16,13 @@ def extract_text_from_pdf(pdf_file):
     pdf_text = ""
     try:
-        # Save the uploaded file to a temporary file
-        with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as temp_pdf:
-            temp_pdf.write(pdf_file)
-            temp_path = temp_pdf.name
-        # Open the temporary file with PyPDF2
-        with open(temp_path, 'rb') as f:
             pdf_reader = PyPDF2.PdfReader(f)
             for page_num in range(len(pdf_reader.pages)):
                 page = pdf_reader.pages[page_num]
                 pdf_text += page.extract_text() + "\n"
-        # Clean up the temporary file
-        os.unlink(temp_path)
     except Exception as e:
         return f"Error processing PDF: {str(e)}"
@@ -122,22 +114,6 @@ def query_qa_system(question, model, index, text_chunks, similarity_threshold=0.
             'found_answer': False
         }
-def ask_question(question, model, index, text_chunks):
-    """
-    User-friendly interface for asking questions
-    """
-    result = query_qa_system(question, model, index, text_chunks)
-    print("\nQ:", question)
-    print("-" * 50)
-    if result['found_answer']:
-        print(f"Found matching section (confidence: {result['confidence']:.2f}):")
-        print(f"\n{result['full_text']}\n")
-        return result
-    else:
-        print(result['full_text'])
-        print(f"Best match confidence: {result['confidence']:.2f}")
-        return result
 # Global variables to store model, index, and text chunks
 global_model = None
 global_index = None

     pdf_text = ""
     try:
+        # In Hugging Face Spaces, pdf_file is already a file path
+        with open(pdf_file.name, 'rb') as f:
             pdf_reader = PyPDF2.PdfReader(f)
             for page_num in range(len(pdf_reader.pages)):
                 page = pdf_reader.pages[page_num]
                 pdf_text += page.extract_text() + "\n"
     except Exception as e:
         return f"Error processing PDF: {str(e)}"
             'found_answer': False
         }
 # Global variables to store model, index, and text chunks
 global_model = None
 global_index = None