Spaces:

amendolajine
/

OPIT

Running

amendolajine committed on Dec 2, 2023

Commit

6c26e5d

1 Parent(s): ec7206a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,27 +24,15 @@ def extract_abstract(pdf_bytes):
 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
-    # Diagnostic print statements
-    print(f"Uploaded file type: {type(uploaded_file)}")
-    if isinstance(uploaded_file, dict):
-        print("Uploaded file is a dictionary.")
-        print(f"Keys available: {uploaded_file.keys()}")
-    # Assuming uploaded_file is a dictionary and contains 'data' key
     try:
-        pdf_bytes = uploaded_file["data"]
-    except (TypeError, KeyError):
-        print("Error accessing 'data' key in uploaded_file")
         return "File content could not be retrieved", None
-# Function to process text (summarize and convert to speech)
-#def process_text(uploaded_file):
-    # Extract the file data (byte content) from the uploaded file
-    # Check if 'content' key exists, and use it to access the file's byte content
-#    if "content" in uploaded_file:
-#        pdf_bytes = uploaded_file["data"]
-#    else:
-#        return "File content could not be retrieved", None
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)

 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
+    # Attempt to extract byte content from NamedString object
     try:
+        pdf_bytes = uploaded_file.file.read()
+    except AttributeError:
+        print("Error reading file content from uploaded_file")
         return "File content could not be retrieved", None
+    # Extract abstract from PDF
+    abstract_text = extract_abstract(pdf_bytes)
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)