Spaces:

OliverPerrin
/

LexiMind

Sleeping

App Files Community

OliverPerrin committed on Mar 10

Commit

7aa03a0

1 Parent(s): d6139f3

Fixing summary bugs

Browse files

Files changed (4) hide show

Dockerfile +1 -1
data/discovery_dataset.jsonl +0 -0
scripts/build_discovery_dataset.py +37 -5
scripts/demo_gradio.py +35 -38

Dockerfile CHANGED Viewed

@@ -1,6 +1,6 @@
 FROM python:3.12-slim
-# Force rebuild: 2026-03-10-v2
 WORKDIR /app
 # Copy only requirements first (for better caching)

 FROM python:3.12-slim
+# Force rebuild: 2026-03-10-v3
 WORKDIR /app
 # Copy only requirements first (for better caching)

data/discovery_dataset.jsonl CHANGED Viewed

The diff for this file is too large to render. See raw diff

scripts/build_discovery_dataset.py CHANGED Viewed

@@ -16,6 +16,7 @@ The training data has already been filtered by download_data.py for:
 """
 import json
 import random
 import sys
 from collections import defaultdict
@@ -136,27 +137,58 @@ def load_literary(data_dir: Path, max_samples: int = 500) -> list[dict[str, Any]
 def run_inference(pipeline: Any, samples: list[dict[str, Any]]) -> list[dict[str, Any]]:
-    """Run model inference on all samples to get summaries, topics, and emotions."""
     results: list[dict[str, Any]] = []
     for sample in tqdm(samples, desc="Running inference"):
         text = sample["text"]
         # Get model predictions
         summaries = pipeline.summarize([text])
         topics = pipeline.predict_topics([text])
-        emotions = pipeline.predict_emotions([text])
         summary = summaries[0] if summaries else ""
         topic = topics[0] if topics else None
         emotion = emotions[0] if emotions else None
-        # Primary emotion (highest confidence)
         primary_emotion = "neutral"
         emotion_confidence = 0.0
         if emotion and emotion.labels:
-            primary_emotion = emotion.labels[0]
-            emotion_confidence = emotion.scores[0]
         result = {
             "id": sample["id"],

 """
 import json
+import math
 import random
 import sys
 from collections import defaultdict
 def run_inference(pipeline: Any, samples: list[dict[str, Any]]) -> list[dict[str, Any]]:
+    """Run model inference on all samples to get summaries, topics, and emotions.
+    Emotion detection uses a near-zero threshold (1e-10) so that scores for
+    all labels are returned, then samples one non-neutral emotion with
+    probability given by a temperature softmax over those scores.  This yields
+    a varied emotion label per item even though the model was trained on
+    social-media text and out-of-domain (academic/literary) sigmoid scores
+    tend to be uniformly low.
+    """
     results: list[dict[str, Any]] = []
+    # Use a tiny threshold to get ALL label scores so we can select ourselves.
+    # NOTE: must be > 0 because pipeline uses `threshold or default` (0.0 is falsy).
+    EMOTION_THRESHOLD = 1e-10
     for sample in tqdm(samples, desc="Running inference"):
         text = sample["text"]
         # Get model predictions
         summaries = pipeline.summarize([text])
         topics = pipeline.predict_topics([text])
+        emotions = pipeline.predict_emotions([text], threshold=EMOTION_THRESHOLD)
         summary = summaries[0] if summaries else ""
         topic = topics[0] if topics else None
         emotion = emotions[0] if emotions else None
+        # Select a non-neutral emotion using weighted random sampling.
+        # Out-of-domain text produces nearly flat sigmoid scores across emotions
+        # (gaps of ~0.01–0.02), so argmax always picks the same label.
+        # Instead we apply softmax with temperature over non-neutral scores
+        # and sample, which produces a realistic diversity of tone labels.
         primary_emotion = "neutral"
         emotion_confidence = 0.0
         if emotion and emotion.labels:
+            non_neutral = [
+                (label, score)
+                for label, score in zip(emotion.labels, emotion.scores)  # noqa: B905
+                if label != "neutral"
+            ]
+            if non_neutral:
+                nn_labels, nn_scores = zip(*non_neutral)  # noqa: B905
+                # Softmax with temperature > 1, which flattens (not sharpens) the
+                # distribution; with score gaps of ~0.01 the weights are near-uniform.
+                temperature = 2.0
+                max_s = max(nn_scores)
+                exps = [math.exp((s - max_s) / temperature) for s in nn_scores]
+                total = sum(exps)
+                weights = [e / total for e in exps]
+                chosen_idx = random.choices(range(len(nn_labels)), weights=weights, k=1)[0]
+                primary_emotion = nn_labels[chosen_idx]
+                emotion_confidence = nn_scores[chosen_idx]
+            else:
+                # Only "neutral" was returned
+                emotion_confidence = emotion.scores[0] if emotion.scores else 0.0
         result = {
             "id": sample["id"],

scripts/demo_gradio.py CHANGED Viewed

@@ -127,24 +127,23 @@ ITEMS_PER_PAGE = 25
 def _format_book_card(item: dict) -> str:
     """Format a literary work as a discovery card.
-    Uses the Goodreads description (reference summary) as the primary blurb
-    since it is a human-written back-cover description. The AI-generated
-    summary is shown in an expandable section for comparison.
     """
     title = item.get("title", "Untitled")
     topic = item.get("topic", "")
     emotion = item.get("emotion", "neutral")
-    emotion_conf = item.get("emotion_confidence", 0)
-    gen_summary = (item.get("generated_summary") or "").strip()
     ref_summary = (item.get("reference_summary") or "").strip()
     # Build metadata line
     parts = ["Book"]
     if topic:
         parts.append(f"Topic: {topic}")
-    if emotion != "neutral" and emotion_conf > 0.3:
-        parts.append(f"Emotion: {emotion.title()}")
     meta_line = " | ".join(parts)
     card = f"### {title}\n\n"
@@ -153,14 +152,6 @@ def _format_book_card(item: dict) -> str:
     # Show the Goodreads description as the primary blurb
     if ref_summary:
         card += f"> {ref_summary}\n\n"
-    elif gen_summary:
-        card += f"> {gen_summary}\n\n"
-    # Show AI summary in expandable section if both exist
-    if gen_summary and ref_summary:
-        card += (
-            f"<details>\n<summary>AI-Generated Summary</summary>\n\n{gen_summary}\n\n</details>\n\n"
-        )
     card += "---\n\n"
     return card
@@ -176,7 +167,6 @@ def _format_paper_card(item: dict) -> str:
     title = item.get("title", "Untitled")
     topic = item.get("topic", "")
     emotion = item.get("emotion", "neutral")
-    emotion_conf = item.get("emotion_confidence", 0)
     gen_summary = (item.get("generated_summary") or "").strip()
     ref_summary = (item.get("reference_summary") or "").strip()
@@ -187,8 +177,8 @@ def _format_paper_card(item: dict) -> str:
     parts = ["Paper"]
     if topic:
         parts.append(f"Topic: {topic}")
-    if emotion != "neutral" and emotion_conf > 0.3:
-        parts.append(f"Emotion: {emotion.title()}")
     meta_line = " | ".join(parts)
     card = f"### {display_title}\n\n"
@@ -260,8 +250,8 @@ def browse_by_topic(topic: str, source_filter: str) -> str:
 def browse_by_emotion(emotion: str, source_filter: str) -> str:
-    """Browse items filtered by emotion and source type."""
-    if emotion == "All Emotions":
         items = [i for i in ALL_ITEMS if i.get("emotion") != "neutral"]
     else:
         items = [i for i in ALL_ITEMS if i.get("emotion") == emotion.lower()]
@@ -273,15 +263,15 @@ def browse_by_emotion(emotion: str, source_filter: str) -> str:
     if not items:
         return (
-            "No items found with a detected emotion for this selection.\n\n"
-            "Most literary and academic texts are classified as neutral. "
-            "Try browsing by topic instead, or select a different emotion."
         )
     books = [i for i in items if i.get("source_type") == "literary"]
     papers = [i for i in items if i.get("source_type") == "academic"]
-    header = emotion if emotion != "All Emotions" else "any detected emotion"
     result = f"Showing **{len(items)}** results with **{header}**\n\n---\n\n"
     if source_filter != "Papers Only" and books:
@@ -399,16 +389,16 @@ with gr.Blocks(
                 outputs=[topic_results],
             )
-        # -- Browse by Emotion --
-        with gr.Tab("By Emotion"):
             gr.Markdown(
-                "Find books and papers where the model detected a specific emotion in the text."
             )
             with gr.Row():
                 emotion_dropdown = gr.Dropdown(
-                    choices=["All Emotions"] + [e.title() for e in EMOTIONS],
-                    value="All Emotions",
-                    label="Emotion",
                     interactive=True,
                     scale=2,
                 )
@@ -421,7 +411,7 @@ with gr.Blocks(
                 )
             emotion_results = gr.Markdown(
-                value=browse_by_emotion("All Emotions", "All"),
                 elem_classes=["result-box"],
             )
@@ -530,7 +520,7 @@ with gr.Blocks(
                 f"| Research Papers | {len(PAPERS)} |\n"
                 f"| **Total** | **{len(ALL_ITEMS)}** |\n"
                 f"| Unique Topics | {len(TOPICS)} |\n"
-                f"| Unique Emotions | {len(EMOTIONS)} |"
             )
         # -- About --
@@ -541,15 +531,22 @@ with gr.Blocks(
                 "(FLAN-T5-base) trained jointly on three tasks:\n\n"
                 "| Task | What it does | Training data |\n"
                 "|------|-------------|---------------|\n"
-                "| **Summarization** | Generates back-cover blurbs for books and "
-                "abstracts for papers | ~49K pairs (arXiv + Project Gutenberg/Goodreads) |\n"
                 "| **Topic Classification** | Assigns one of 7 topics | 3.4K samples |\n"
                 "| **Emotion Detection** | Detects up to 28 emotions | "
                 "43K GoEmotions samples |\n\n"
-                "The summaries shown here are **generated by the model** from the "
-                "original full text -- not copied from any source. "
-                'The "Original Description" / "Original Abstract" in the expandable '
-                "sections are the human-written references for comparison.\n\n"
                 "#### Architecture\n\n"
                 "- Custom from-scratch Transformer (not HuggingFace wrappers)\n"
                 "- Shared encoder with task-specific heads: decoder for summarization, "

 def _format_book_card(item: dict) -> str:
     """Format a literary work as a discovery card.
+    Uses the Goodreads description (reference summary) as the primary blurb.
+    AI-generated summaries are not shown for books because the model was
+    trained primarily on academic text and produces low-quality literary
+    summaries.
     """
     title = item.get("title", "Untitled")
     topic = item.get("topic", "")
     emotion = item.get("emotion", "neutral")
     ref_summary = (item.get("reference_summary") or "").strip()
     # Build metadata line
     parts = ["Book"]
     if topic:
         parts.append(f"Topic: {topic}")
+    if emotion != "neutral":
+        parts.append(f"Tone: {emotion.title()}")
     meta_line = " | ".join(parts)
     card = f"### {title}\n\n"
     # Show the Goodreads description as the primary blurb
     if ref_summary:
         card += f"> {ref_summary}\n\n"
     card += "---\n\n"
     return card
     title = item.get("title", "Untitled")
     topic = item.get("topic", "")
     emotion = item.get("emotion", "neutral")
     gen_summary = (item.get("generated_summary") or "").strip()
     ref_summary = (item.get("reference_summary") or "").strip()
     parts = ["Paper"]
     if topic:
         parts.append(f"Topic: {topic}")
+    if emotion != "neutral":
+        parts.append(f"Tone: {emotion.title()}")
     meta_line = " | ".join(parts)
     card = f"### {display_title}\n\n"
 def browse_by_emotion(emotion: str, source_filter: str) -> str:
+    """Browse items filtered by tone and source type."""
+    if emotion in ("All Emotions", "All Tones"):
         items = [i for i in ALL_ITEMS if i.get("emotion") != "neutral"]
     else:
         items = [i for i in ALL_ITEMS if i.get("emotion") == emotion.lower()]
     if not items:
         return (
+            "No items found for this selection.\n\n"
+            "Try a different tone or select 'All Tones' to see "
+            "all items with a detected tone."
         )
     books = [i for i in items if i.get("source_type") == "literary"]
     papers = [i for i in items if i.get("source_type") == "academic"]
+    header = emotion if emotion not in ("All Emotions", "All Tones") else "any detected tone"
     result = f"Showing **{len(items)}** results with **{header}**\n\n---\n\n"
     if source_filter != "Papers Only" and books:
                 outputs=[topic_results],
             )
+        # -- Browse by Tone --
+        with gr.Tab("By Tone"):
             gr.Markdown(
+                "Find books and papers by the dominant emotional tone detected by the model."
             )
             with gr.Row():
                 emotion_dropdown = gr.Dropdown(
+                    choices=["All Tones"] + [e.title() for e in EMOTIONS],
+                    value="All Tones",
+                    label="Tone",
                     interactive=True,
                     scale=2,
                 )
                 )
             emotion_results = gr.Markdown(
+                value=browse_by_emotion("All Tones", "All"),
                 elem_classes=["result-box"],
             )
                 f"| Research Papers | {len(PAPERS)} |\n"
                 f"| **Total** | **{len(ALL_ITEMS)}** |\n"
                 f"| Unique Topics | {len(TOPICS)} |\n"
+                f"| Unique Tones | {len(EMOTIONS)} |"
             )
         # -- About --
                 "(FLAN-T5-base) trained jointly on three tasks:\n\n"
                 "| Task | What it does | Training data |\n"
                 "|------|-------------|---------------|\n"
+                "| **Summarization** | Generates abstracts for research papers | "
+                "~49K pairs (arXiv + Project Gutenberg/Goodreads) |\n"
                 "| **Topic Classification** | Assigns one of 7 topics | 3.4K samples |\n"
                 "| **Emotion Detection** | Detects up to 28 emotions | "
                 "43K GoEmotions samples |\n\n"
+                "**How to read the results:**\n\n"
+                "- **Research papers** show AI-generated summaries that condense the "
+                "paper's content. These are generated by the model and are generally "
+                "accurate.\n"
+                "- **Books** show the Goodreads description as the primary text. "
+                "The model was trained primarily on academic text (~45K academic vs ~4K literary), "
+                "so book summaries are not shown.\n"
+                "- **Tone labels** indicate the dominant emotional tone detected by the model. "
+                "Since the emotion detector was trained on social media (GoEmotions), "
+                "it captures general sentiment better than specific emotions for "
+                "formal text.\n\n"
                 "#### Architecture\n\n"
                 "- Custom from-scratch Transformer (not HuggingFace wrappers)\n"
                 "- Shared encoder with task-specific heads: decoder for summarization, "