Spaces:

Deevyankar
/

Handouts

Sleeping

App Files Files Community

Deevyankar committed on Sep 21, 2025

Commit

e293e42

verified ·

1 Parent(s): 7889bda

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -6

app.py CHANGED Viewed

@@ -1,4 +1,3 @@
 import gradio as gr
 import fitz  # PyMuPDF
 import docx
@@ -7,6 +6,7 @@ import re
 import os
 import matplotlib.pyplot as plt
 import numpy as np
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sentence_transformers import SentenceTransformer, util
 from difflib import SequenceMatcher
@@ -62,11 +62,11 @@ def compare_handouts(old_pdf, new_pdf, lo_file):
     new_text = extract_text_from_pdf(new_pdf)
     if len(old_text.strip()) < 200 or len(new_text.strip()) < 200:
-        return "⚠️ Could not extract meaningful content from one or both PDFs.", None
     lo_list = extract_text_from_docx(lo_file)
     if not lo_list:
-        return "⚠️ No learning outcomes detected.", None
     old_scores = semantic_match(lo_list, old_text)
     new_scores = semantic_match(lo_list, new_text)
@@ -82,6 +82,16 @@ def compare_handouts(old_pdf, new_pdf, lo_file):
     else:
         summary += "⚠️ Summary: No significant improvement in LO alignment."
     # Plot
     x = np.arange(len(lo_list))
     width = 0.35
@@ -95,7 +105,7 @@ def compare_handouts(old_pdf, new_pdf, lo_file):
     ax.legend()
     plt.tight_layout()
-    return summary, fig
 with gr.Blocks() as demo:
     gr.Markdown("📘 **Educational Content Comparator**")
@@ -112,8 +122,9 @@ with gr.Blocks() as demo:
     output_text = gr.Textbox(label="📋 Summary", lines=5, interactive=False)
     output_plot = gr.Plot(label="📊 LO Match Chart")
-    btn.click(fn=compare_handouts, inputs=[old_pdf, new_pdf, lo_file], outputs=[output_text, output_plot])
-    clear_btn.click(fn=lambda: ("", None), inputs=[], outputs=[output_text, output_plot])
 demo.launch()

 import gradio as gr
 import fitz  # PyMuPDF
 import docx
 import os
 import matplotlib.pyplot as plt
 import numpy as np
+import pandas as pd
 from sklearn.feature_extraction.text import TfidfVectorizer
 from sentence_transformers import SentenceTransformer, util
 from difflib import SequenceMatcher
     new_text = extract_text_from_pdf(new_pdf)
     if len(old_text.strip()) < 200 or len(new_text.strip()) < 200:
+        return "⚠️ Could not extract meaningful content from one or both PDFs.", None, None
     lo_list = extract_text_from_docx(lo_file)
     if not lo_list:
+        return "⚠️ No learning outcomes detected.", None, None
     old_scores = semantic_match(lo_list, old_text)
     new_scores = semantic_match(lo_list, new_text)
     else:
         summary += "⚠️ Summary: No significant improvement in LO alignment."
+    # Create comparison table
+    df = pd.DataFrame({
+        "Learning Outcome": [f"LO{i+1}" for i in range(len(lo_list))],
+        "Old Match Score": old_scores,
+        "New Match Score": new_scores,
+        "Improvement": np.array(new_scores) - np.array(old_scores)
+    })
+    excel_path = "/mnt/data/LO_Comparison_Report.xlsx"
+    df.to_excel(excel_path, index=False)
     # Plot
     x = np.arange(len(lo_list))
     width = 0.35
     ax.legend()
     plt.tight_layout()
+    return summary, fig, excel_path
 with gr.Blocks() as demo:
     gr.Markdown("📘 **Educational Content Comparator**")
     output_text = gr.Textbox(label="📋 Summary", lines=5, interactive=False)
     output_plot = gr.Plot(label="📊 LO Match Chart")
+    output_excel = gr.File(label="📄 Download Excel Report")
+    btn.click(fn=compare_handouts, inputs=[old_pdf, new_pdf, lo_file], outputs=[output_text, output_plot, output_excel])
+    clear_btn.click(fn=lambda: ("", None, None), inputs=[], outputs=[output_text, output_plot, output_excel])
 demo.launch()