Spaces:

heerjtdev
/

example

Sleeping

App Files Files Community

heerjtdev committed on Feb 12

Commit

3eeedea

verified ·

1 Parent(s): 7bf9c65

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -23

app.py CHANGED Viewed

@@ -153,25 +153,27 @@ def generate_qa_pairs(chunk: str, num_questions: int = 2) -> List[Dict[str, str]
 def process_pdf(pdf_file, questions_per_chunk: int = 2, max_chunks: int = 20):
     """Main processing function."""
     if pdf_file is None:
-        return "Please upload a PDF file.", None, None
     try:
         # Extract text
-        yield "📄 Extracting text from PDF...", None, None
         raw_text = extract_text_from_pdf(pdf_file)
         if raw_text.startswith("Error"):
-            return raw_text, None, None
         if len(raw_text.strip()) < 100:
-            return "PDF appears to be empty or contains no extractable text.", None, None
         # Clean text
-        yield "🧹 Cleaning text...", None, None
         cleaned_text = clean_text(raw_text)
         # Chunk text
-        yield "✂️ Chunking text into sections...", None, None
         chunks = chunk_text(cleaned_text)
         # Limit chunks for CPU performance
@@ -183,16 +185,17 @@ def process_pdf(pdf_file, questions_per_chunk: int = 2, max_chunks: int = 20):
         for i, chunk in enumerate(chunks):
             progress = f"🎴 Generating flashcards... ({i+1}/{total_chunks} chunks processed)"
-            yield progress, None, None
             cards = generate_qa_pairs(chunk, questions_per_chunk)
             all_flashcards.extend(cards)
         if not all_flashcards:
-            return "Could not generate flashcards from this PDF. Try a PDF with more textual content.", None, None
         # Format output
-        yield "✅ Finalizing...", None, None
         # Create formatted display
         display_text = format_flashcards_display(all_flashcards)
@@ -208,10 +211,13 @@ def process_pdf(pdf_file, questions_per_chunk: int = 2, max_chunks: int = 20):
             csv_lines.append(f'"{q}","{a}"')
         csv_output = "\n".join(csv_lines)
-        return display_text, csv_output, json_output
     except Exception as e:
-        return f"Error processing PDF: {str(e)}", None, None
 def format_flashcards_display(flashcards: List[Dict]) -> str:
     """Format flashcards for nice display."""
@@ -335,21 +341,11 @@ with gr.Blocks(css=custom_css, title="PDF to Flashcards") as demo:
             )
             gr.Markdown("*Raw JSON data for custom applications*")
-    # Event handlers
-    def update_display(status):
-        """Update display when processing is done."""
-        if status and not status.startswith(("📄", "🧹", "✂️", "🎴", "✅")):
-            return status
-        return gr.update()
     process_btn.click(
         fn=process_pdf,
         inputs=[pdf_input, questions_per_chunk, max_chunks],
-        outputs=[status_text, csv_output, json_output]
-    ).then(
-        fn=update_display,
-        inputs=status_text,
-        outputs=output_display
     )
     # Example section

 def process_pdf(pdf_file, questions_per_chunk: int = 2, max_chunks: int = 20):
     """Main processing function."""
     if pdf_file is None:
+        return "Please upload a PDF file.", "", "", "Your flashcards will appear here..."
     try:
         # Extract text
+        yield "📄 Extracting text from PDF...", "", "", "Processing..."
         raw_text = extract_text_from_pdf(pdf_file)
         if raw_text.startswith("Error"):
+            yield raw_text, "", "", "Error occurred"
+            return
         if len(raw_text.strip()) < 100:
+            yield "PDF appears to be empty or contains no extractable text.", "", "", "Error occurred"
+            return
         # Clean text
+        yield "🧹 Cleaning text...", "", "", "Processing..."
         cleaned_text = clean_text(raw_text)
         # Chunk text
+        yield "✂️ Chunking text into sections...", "", "", "Processing..."
         chunks = chunk_text(cleaned_text)
         # Limit chunks for CPU performance
         for i, chunk in enumerate(chunks):
             progress = f"🎴 Generating flashcards... ({i+1}/{total_chunks} chunks processed)"
+            yield progress, "", "", "Processing..."
             cards = generate_qa_pairs(chunk, questions_per_chunk)
             all_flashcards.extend(cards)
         if not all_flashcards:
+            yield "Could not generate flashcards from this PDF. Try a PDF with more textual content.", "", "", "No flashcards generated"
+            return
         # Format output
+        yield "✅ Finalizing...", "", "", "Almost done..."
         # Create formatted display
         display_text = format_flashcards_display(all_flashcards)
             csv_lines.append(f'"{q}","{a}"')
         csv_output = "\n".join(csv_lines)
+        # FINAL OUTPUT - this updates all components
+        yield "✅ Done! Generated {} flashcards".format(len(all_flashcards)), csv_output, json_output, display_text
     except Exception as e:
+        error_msg = f"Error processing PDF: {str(e)}"
+        print(error_msg)
+        yield error_msg, "", "", error_msg
 def format_flashcards_display(flashcards: List[Dict]) -> str:
     """Format flashcards for nice display."""
             )
             gr.Markdown("*Raw JSON data for custom applications*")
+    # FIXED: Direct binding without the broken .then() chain
     process_btn.click(
         fn=process_pdf,
         inputs=[pdf_input, questions_per_chunk, max_chunks],
+        outputs=[status_text, csv_output, json_output, output_display]
     )
     # Example section