Spaces:

amendolajine
/

OPIT

Running

amendolajine committed on Dec 2, 2023

Commit

ec7206a

1 Parent(s): 41dd0e4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,11 +24,19 @@ def extract_abstract(pdf_bytes):
 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
-    # Extract the file data (byte content) from the uploaded file
-    pdf_bytes = uploaded_file["data"]
-    abstract_text = extract_abstract(pdf_bytes)
 # Function to process text (summarize and convert to speech)
 #def process_text(uploaded_file):
     # Extract the file data (byte content) from the uploaded file
@@ -38,8 +46,6 @@ def process_text(uploaded_file):
 #    else:
 #        return "File content could not be retrieved", None
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)
     summary_ids = model.generate(inputs['input_ids'], num_beams=4, max_length=40, min_length=10, length_penalty=2.0, early_stopping=True, no_repeat_ngram_size=2)

 # Function to process text (summarize and convert to speech)
 def process_text(uploaded_file):
+    # Diagnostic print statements
+    print(f"Uploaded file type: {type(uploaded_file)}")
+    if isinstance(uploaded_file, dict):
+        print("Uploaded file is a dictionary.")
+        print(f"Keys available: {uploaded_file.keys()}")
+    # Assuming uploaded_file is a dictionary and contains 'data' key
+    try:
+        pdf_bytes = uploaded_file["data"]
+    except (TypeError, KeyError):
+        print("Error accessing 'data' key in uploaded_file")
+        return "File content could not be retrieved", None
 # Function to process text (summarize and convert to speech)
 #def process_text(uploaded_file):
     # Extract the file data (byte content) from the uploaded file
 #    else:
 #        return "File content could not be retrieved", None
     # Generate summary
     inputs = tokenizer([abstract_text], max_length=1024, return_tensors='pt', truncation=True)
     summary_ids = model.generate(inputs['input_ids'], num_beams=4, max_length=40, min_length=10, length_penalty=2.0, early_stopping=True, no_repeat_ngram_size=2)