Spaces:

mk1985
/

Historical-Text-Analyser

Sleeping

App Files Files Community

mk1985 committed on Jul 23, 2025

Commit

1773b6d

verified ·

1 Parent(s): d56dd19

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -12

app.py CHANGED Viewed

@@ -10,9 +10,9 @@ import gradio as gr
 from gliner import GLiNER
 from collections import defaultdict
 import numpy as np
-import pandas as pd # Import pandas for DataFrame
 import os
-import tempfile # For creating temporary CSV files
 # 🧠 Supported models and their providers
 MODEL_OPTIONS = {
@@ -69,7 +69,6 @@ def generate_from_prompt(prompt, provider, key_dict):
     return ""
 # --- UI Definitions ---
 STANDARD_LABELS = [
     "Person", "Organization", "Location", "Country", "City", "State",
     "Nationality", "Group", "Date", "Event", "Law", "Legal Document",
@@ -153,15 +152,25 @@ with gr.Blocks(title="Historical Text Analysis Tool", css=".prose { word-break:
             key_dict = {"openai_key": os.environ.get("OPENAI_API_KEY", openai_k), "anthropic_key": os.environ.get("ANTHROPIC_API_KEY", anthropic_k), "google_key": os.environ.get("GOOGLE_API_KEY", google_k)}
             provider_id = MODEL_OPTIONS.get(provider)
             if not topic or not provider or not key_dict.get(f"{provider_id}_key"): raise gr.Error("A topic, provider, and valid API Key for that provider are required.")
             prompt = FRAMEWORK_PROMPT_TEMPLATE.format(topic=topic)
             raw_framework = generate_from_prompt(prompt, provider, key_dict)
             framework = defaultdict(list)
             current_category = None
             for line in raw_framework.split('\n'):
                 line = line.strip()
-                if line.startswith("###"): current_category = line.replace("###", "").strip()
-                elif line.startswith("-") and current_category: framework[current_category].extend([e.strip() for e in entities.split(',') if e.strip()])
             if not framework: raise gr.Error("The AI failed to generate categories. Please try again or rephrase your topic.")
             updates = {}
             categories = list(framework.items())
             for i in range(MAX_CATEGORIES):
@@ -178,6 +187,7 @@ with gr.Blocks(title="Historical Text Analysis Tool", css=".prose { word-break:
                     updates[cg] = gr.update(choices=[], value=[], visible=False)
                     updates[sel] = gr.update(visible=False)
                     updates[desel] = gr.update(visible=False)
             updates[generate_btn] = gr.update(value="Generate Framework", interactive=True)
             yield updates
         except Exception as e:
@@ -241,8 +251,6 @@ with gr.Blocks(title="Historical Text Analysis Tool", css=".prose { word-break:
         results_df = pd.DataFrame(table_rows)
         if not results_df.empty: results_df = results_df.sort_values(by=["Label", "Instances"], ascending=[True, False])
-        # *** BUG FIX IS HERE ***
-        # The final dictionary MUST include a key for every component in the `outputs` list.
         yield {
             analyze_btn: gr.update(value="Find Entities", interactive=True),
             analysis_status: gr.update(visible=False),
@@ -250,20 +258,15 @@ with gr.Blocks(title="Historical Text Analysis Tool", css=".prose { word-break:
             detailed_results_output: results_df,
             results_state: results_df,
             debug_output: "Analysis complete.",
-            # This line was missing, which caused the bug.
             csv_file_output: gr.update(visible=False, value=None)
         }
     def export_to_csv(df):
         if df is None or df.empty:
             gr.Info("No data to export. Please run 'Find Entities' first.")
-            # Return an update to ensure the component remains hidden
             return gr.update(visible=False)
-        # Use a temporary file that Gradio can access
         with tempfile.NamedTemporaryFile(delete=False, mode='w', suffix='.csv', encoding='utf-8') as tmpfile:
             df.to_csv(tmpfile.name, index=False)
-            # Return an update with the file path and set visibility to True
             return gr.update(value=tmpfile.name, visible=True)
     # --- Wire up UI events ---

 from gliner import GLiNER
 from collections import defaultdict
 import numpy as np
+import pandas as pd
 import os
+import tempfile
 # 🧠 Supported models and their providers
 MODEL_OPTIONS = {
     return ""
 # --- UI Definitions ---
 STANDARD_LABELS = [
     "Person", "Organization", "Location", "Country", "City", "State",
     "Nationality", "Group", "Date", "Event", "Law", "Legal Document",
             key_dict = {"openai_key": os.environ.get("OPENAI_API_KEY", openai_k), "anthropic_key": os.environ.get("ANTHROPIC_API_KEY", anthropic_k), "google_key": os.environ.get("GOOGLE_API_KEY", google_k)}
             provider_id = MODEL_OPTIONS.get(provider)
             if not topic or not provider or not key_dict.get(f"{provider_id}_key"): raise gr.Error("A topic, provider, and valid API Key for that provider are required.")
             prompt = FRAMEWORK_PROMPT_TEMPLATE.format(topic=topic)
             raw_framework = generate_from_prompt(prompt, provider, key_dict)
             framework = defaultdict(list)
             current_category = None
             for line in raw_framework.split('\n'):
                 line = line.strip()
+                if line.startswith("###"):
+                    current_category = line.replace("###", "").strip()
+                # *** BUG FIX WAS HERE ***
+                elif line.startswith("-") and current_category:
+                    # Correctly assign the line content to a variable first
+                    entities_string = line.replace("-", "").strip()
+                    # Then use that variable
+                    framework[current_category].extend([e.strip() for e in entities_string.split(',') if e.strip()])
             if not framework: raise gr.Error("The AI failed to generate categories. Please try again or rephrase your topic.")
             updates = {}
             categories = list(framework.items())
             for i in range(MAX_CATEGORIES):
                     updates[cg] = gr.update(choices=[], value=[], visible=False)
                     updates[sel] = gr.update(visible=False)
                     updates[desel] = gr.update(visible=False)
             updates[generate_btn] = gr.update(value="Generate Framework", interactive=True)
             yield updates
         except Exception as e:
         results_df = pd.DataFrame(table_rows)
         if not results_df.empty: results_df = results_df.sort_values(by=["Label", "Instances"], ascending=[True, False])
         yield {
             analyze_btn: gr.update(value="Find Entities", interactive=True),
             analysis_status: gr.update(visible=False),
             detailed_results_output: results_df,
             results_state: results_df,
             debug_output: "Analysis complete.",
             csv_file_output: gr.update(visible=False, value=None)
         }
     def export_to_csv(df):
         """Save ``df`` to a temporary CSV file and return a component update for it.

         When ``df`` is ``None`` or empty, an informational message is shown and
         the returned update only sets ``visible=False``. Otherwise the returned
         update carries the CSV file path as ``value`` and sets ``visible=True``.
         """
         has_rows = df is not None and not df.empty
         if not has_rows:
             gr.Info("No data to export. Please run 'Find Entities' first.")
             return gr.update(visible=False)
         # delete=False keeps the file on disk after the handle below is closed.
         with tempfile.NamedTemporaryFile(delete=False, mode='w', suffix='.csv', encoding='utf-8') as csv_handle:
             csv_path = csv_handle.name
             df.to_csv(csv_path, index=False)
         return gr.update(value=csv_path, visible=True)
     # --- Wire up UI events ---