Spaces:

akazmi
/

Legal2

Sleeping

akazmi committed on Nov 11, 2024

Commit

c292876

verified ·

1 Parent(s): bb9ec18

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,14 +10,18 @@ import numpy as np
 # Initialize Groq API
 client = Groq(api_key=os.getenv("GROQ_API_KEY"))
-# Function to list PDF files in the current directory
 def list_pdf_files():
-    pdf_files = [f for f in os.listdir('.') if f.endswith('.pdf')]
     return pdf_files
 # Function to extract text and split into chunks using pdfplumber
-def extract_text_from_pdf(file_path):
     try:
         full_text = ""
         with pdfplumber.open(file_path) as pdf:
             for page in pdf.pages:
@@ -48,8 +52,8 @@ def retrieve_relevant_chunks(chunks, question):
         return ""
 # Function to answer the question using selected relevant chunks
-def answer_question(pdf_file, question):
-    chunks = extract_text_from_pdf(pdf_file)
     if not chunks:
         return "Error: Could not extract text from PDF."

 # Initialize Groq API
 client = Groq(api_key=os.getenv("GROQ_API_KEY"))
+# Path to the directory containing PDFs in Hugging Face Space
+PDF_DIR = "./Legal2/main"
+# Function to list PDF files in the Hugging Face Space directory
 def list_pdf_files():
+    pdf_files = [f for f in os.listdir(PDF_DIR) if f.endswith('.pdf')]
     return pdf_files
 # Function to extract text and split into chunks using pdfplumber
+def extract_text_from_pdf(file_name):
     try:
+        file_path = os.path.join(PDF_DIR, file_name)
         full_text = ""
         with pdfplumber.open(file_path) as pdf:
             for page in pdf.pages:
         return ""
 # Function to answer the question using selected relevant chunks
+def answer_question(file_name, question):
+    chunks = extract_text_from_pdf(file_name)
     if not chunks:
         return "Error: Could not extract text from PDF."