Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -6,24 +6,14 @@ import streamlit as st
|
|
| 6 |
from keybert import KeyBERT
|
| 7 |
from textblob import TextBlob
|
| 8 |
from transformers import pipeline
|
|
|
|
| 9 |
|
| 10 |
# constants
|
| 11 |
MAX_TEXT_LENGTH = 1500
|
| 12 |
|
| 13 |
-
|
| 14 |
-
CANDIDATE_TONES = [
|
| 15 |
-
"objective", "alarmist", "defensive", "optimistic", "critical",
|
| 16 |
-
"sensationalist", "somber", "sympathetic", "hostile", "satirical",
|
| 17 |
-
"urgent", "dismissive", "patriotic", "cynical", "apologetic"
|
| 18 |
-
]
|
| 19 |
|
| 20 |
-
|
| 21 |
-
Global leaders achieved a historic breakthrough today, signing a comprehensive climate accord aimed at drastically slashing carbon emissions by 2030. Environmental advocates are celebrating the mandate, which forces heavy-polluting industries to finally take accountability for their ecological damage. While corporations warn of transition costs, scientists emphasize that failing to act now would result in catastrophic, irreversible damage to our planet's fragile ecosystems.
|
| 22 |
-
"""
|
| 23 |
-
|
| 24 |
-
ARTICLE_B = """
|
| 25 |
-
A sweeping new climate agreement signed today is drawing fierce criticism from industry leaders, who warn the aggressive emission targets will cripple economic growth. The heavy-handed regulations impose massive compliance costs on the manufacturing and energy sectors, inevitably leading to significant job losses and higher prices for consumers. Critics argue the rushed accord prioritizes bureaucratic posturing over practical, market-driven solutions to environmental concerns.
|
| 26 |
-
"""
|
| 27 |
|
| 28 |
|
| 29 |
@st.cache_resource
|
|
@@ -32,61 +22,81 @@ def _load_nlp_models() -> typing.Dict[str, typing.Any]:
|
|
| 32 |
Loads NLP models into memory and caches them.
|
| 33 |
"""
|
| 34 |
sentiment_analyzer = pipeline(
|
| 35 |
-
"
|
| 36 |
-
model="
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 37 |
)
|
| 38 |
-
|
| 39 |
-
"
|
| 40 |
-
model="
|
|
|
|
| 41 |
)
|
| 42 |
keyword_extractor = KeyBERT(model="all-mpnet-base-v2")
|
| 43 |
|
| 44 |
return {
|
| 45 |
"sentiment": sentiment_analyzer,
|
| 46 |
-
"
|
|
|
|
| 47 |
"keyword": keyword_extractor,
|
| 48 |
}
|
| 49 |
|
| 50 |
|
| 51 |
def analyze_article(text: str) -> dict:
|
| 52 |
-
"""Analyzes framing using semantic keyphrases, sentiment,
|
| 53 |
models = _load_nlp_models()
|
| 54 |
safe_text = text[:MAX_TEXT_LENGTH]
|
| 55 |
|
| 56 |
# Sentiment Analysis
|
| 57 |
sentiment_result = models["sentiment"](safe_text)[0]
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
-
|
| 62 |
-
|
| 63 |
-
|
| 64 |
-
|
| 65 |
-
|
| 66 |
-
|
| 67 |
-
|
| 68 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 69 |
|
| 70 |
# Semantic Keyword Extraction
|
| 71 |
keyword_results = models["keyword"].extract_keywords(
|
| 72 |
-
safe_text,
|
| 73 |
-
keyphrase_ngram_range=(1, 3),
|
| 74 |
-
stop_words="english",
|
| 75 |
use_mmr=True,
|
| 76 |
diversity=0.6,
|
| 77 |
top_n=5
|
| 78 |
)
|
| 79 |
extracted_keywords = [kw[0] for kw in keyword_results]
|
| 80 |
|
| 81 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
| 82 |
subjectivity_score = TextBlob(safe_text).sentiment.subjectivity
|
|
|
|
| 83 |
|
| 84 |
return {
|
| 85 |
"sentiment_score": sentiment_score,
|
| 86 |
"subjectivity_score": subjectivity_score,
|
| 87 |
-
"
|
|
|
|
| 88 |
"tone_scores": tone_scores,
|
| 89 |
"keywords": extracted_keywords,
|
|
|
|
| 90 |
}
|
| 91 |
|
| 92 |
|
|
@@ -102,9 +112,9 @@ def _create_sentiment_gauge(score: float, title: str) -> go.Figure:
|
|
| 102 |
"axis": {"range": [-1, 1], "tickwidth": 1},
|
| 103 |
"bar": {"color": "darkblue"},
|
| 104 |
"steps": [
|
| 105 |
-
{"range": [-1, -0.2], "color": "#ffb3b3"},
|
| 106 |
-
{"range": [-0.2, 0.2], "color": "#f2f2f2"},
|
| 107 |
-
{"range": [0.2, 1], "color": "#b3ffb3"},
|
| 108 |
],
|
| 109 |
},
|
| 110 |
)
|
|
@@ -113,28 +123,32 @@ def _create_sentiment_gauge(score: float, title: str) -> go.Figure:
|
|
| 113 |
return fig
|
| 114 |
|
| 115 |
|
| 116 |
-
def
|
| 117 |
-
"""Generates
|
| 118 |
-
|
| 119 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 120 |
|
| 121 |
-
fig = go.Figure(
|
| 122 |
-
go.Bar(
|
| 123 |
-
x=values,
|
| 124 |
-
y=labels,
|
| 125 |
-
orientation="h",
|
| 126 |
-
marker_color="#4f46e5",
|
| 127 |
-
marker_line_color="white",
|
| 128 |
-
marker_line_width=1.5
|
| 129 |
-
)
|
| 130 |
-
)
|
| 131 |
fig.update_layout(
|
| 132 |
-
|
| 133 |
-
|
| 134 |
-
|
| 135 |
-
|
| 136 |
-
|
| 137 |
-
plot_bgcolor="rgba(0,0,0,0)",
|
| 138 |
)
|
| 139 |
return fig
|
| 140 |
|
|
@@ -164,56 +178,67 @@ st.title("FrameVis")
|
|
| 164 |
st.markdown("##### Media bias and framing effects across global news sources.")
|
| 165 |
st.divider()
|
| 166 |
|
| 167 |
-
with st.spinner("Starting NLP
|
| 168 |
_load_nlp_models()
|
| 169 |
|
| 170 |
col1, col2 = st.columns(2)
|
| 171 |
|
| 172 |
with col1:
|
| 173 |
user_article_a = st.text_area("Data Source A", value=ARTICLE_A.strip(), height=220)
|
| 174 |
-
if st.button("Analyze A", use_container_width=True):
|
| 175 |
-
with st.spinner("Processing Source A."):
|
| 176 |
-
st.session_state.results_a = analyze_article(user_article_a)
|
| 177 |
|
| 178 |
with col2:
|
| 179 |
user_article_b = st.text_area("Data Source B", value=ARTICLE_B.strip(), height=220)
|
| 180 |
-
if st.button("Analyze B", use_container_width=True):
|
| 181 |
-
with st.spinner("Processing Source B."):
|
| 182 |
-
st.session_state.results_b = analyze_article(user_article_b)
|
| 183 |
|
| 184 |
-
st.write("")
|
| 185 |
|
| 186 |
-
#
|
| 187 |
-
if st.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 188 |
st.markdown("### Framing Analytics & Comparison")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 189 |
res_col1, res_col2 = st.columns(2)
|
| 190 |
|
| 191 |
# Render Column A
|
| 192 |
with res_col1:
|
| 193 |
-
|
| 194 |
-
|
| 195 |
-
|
| 196 |
-
|
| 197 |
-
|
| 198 |
-
|
| 199 |
-
|
| 200 |
-
|
| 201 |
-
|
| 202 |
-
|
| 203 |
-
|
| 204 |
-
|
|
|
|
|
|
|
|
|
|
| 205 |
|
| 206 |
# Render Column B
|
| 207 |
with res_col2:
|
| 208 |
-
|
| 209 |
-
|
| 210 |
-
|
| 211 |
-
|
| 212 |
-
|
| 213 |
-
|
| 214 |
-
|
| 215 |
-
|
| 216 |
-
|
| 217 |
-
|
| 218 |
-
|
| 219 |
-
|
|
|
|
|
|
|
|
|
|
|
|
| 6 |
from keybert import KeyBERT
|
| 7 |
from textblob import TextBlob
|
| 8 |
from transformers import pipeline
|
| 9 |
+
import textstat
|
| 10 |
|
| 11 |
# constants
MAX_TEXT_LENGTH = 1500  # max characters fed to the NLP models per article (keeps latency bounded)

# Demo text: the same climate-accord story framed favorably (pro-accord slant).
ARTICLE_A = """Global leaders achieved a historic breakthrough today, signing a comprehensive climate accord aimed at drastically slashing carbon emissions by 2030. Environmental advocates are celebrating the mandate, which forces heavy-polluting industries to finally take accountability for their ecological damage. While corporations warn of transition costs, scientists emphasize that failing to act now would result in catastrophic, irreversible damage to our planet's fragile ecosystems."""

# Demo text: the same story framed critically (anti-accord slant), for side-by-side comparison.
ARTICLE_B = """A sweeping new climate agreement signed today is drawing fierce criticism from industry leaders, who warn the aggressive emission targets will cripple economic growth. The heavy-handed regulations impose massive compliance costs on the manufacturing and energy sectors, inevitably leading to significant job losses and higher prices for consumers. Critics argue the rushed accord prioritizes bureaucratic posturing over practical, market-driven solutions to environmental concerns."""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 17 |
|
| 18 |
|
| 19 |
@st.cache_resource
def _load_nlp_models() -> typing.Dict[str, typing.Any]:
    """
    Loads NLP models into memory and caches them.

    Decorated with st.cache_resource so the heavyweight pipelines are
    constructed once per process and reused across Streamlit reruns.
    """
    # Keys are the names analyze_article() looks up in this registry.
    return {
        "sentiment": pipeline(
            "text-classification",
            model="cardiffnlp/twitter-roberta-base-sentiment-latest",
        ),
        "emotion": pipeline(
            "text-classification",
            model="SamLowe/roberta-base-go_emotions",
            top_k=5,
        ),
        "ner": pipeline(
            "ner",
            model="dslim/bert-base-NER",
            aggregation_strategy="simple",
        ),
        "keyword": KeyBERT(model="all-mpnet-base-v2"),
    }
|
| 46 |
|
| 47 |
|
| 48 |
def analyze_article(text: str) -> dict:
    """Analyzes framing using semantic keyphrases, sentiment, emotion, readability and NER.

    Args:
        text: Raw article text; only the first MAX_TEXT_LENGTH characters are analyzed.

    Returns:
        dict with keys: sentiment_score (signed float in [-1, 1]),
        subjectivity_score, reading_ease, primary_tone, tone_scores,
        keywords, entities.
    """
    models = _load_nlp_models()
    # Truncate so inference latency stays bounded and within model context limits.
    safe_text = text[:MAX_TEXT_LENGTH]

    # Sentiment Analysis: fold the classifier label into a signed [-1, 1] score.
    sentiment_result = models["sentiment"](safe_text)[0]
    label = sentiment_result["label"].lower()
    score = sentiment_result["score"]
    if label == "negative":
        sentiment_score = -score
    elif label == "positive":
        sentiment_score = score
    else:
        sentiment_score = 0.0  # Neutral

    # Emotion Classification: a pipeline with top_k returns a score-sorted list,
    # so the first entry is the dominant emotion.
    emotion_results = models["emotion"](safe_text)[0]
    if isinstance(emotion_results, list):
        tone_scores = {res["label"]: res["score"] for res in emotion_results}
        primary_tone = emotion_results[0]["label"]
    else:
        tone_scores = {"neutral": 1.0}
        primary_tone = "neutral"

    # Semantic Keyword Extraction (MMR keeps the extracted phrases diverse).
    keyword_results = models["keyword"].extract_keywords(
        safe_text,
        keyphrase_ngram_range=(1, 3),
        stop_words="english",
        use_mmr=True,
        diversity=0.6,
        top_n=5
    )
    extracted_keywords = [kw[0] for kw in keyword_results]

    # Named Entity Recognition. FIX: sort after de-duplicating — list(set(...))
    # produced an arbitrary order that changed on every run, making the UI flicker.
    ner_results = models["ner"](safe_text)
    extracted_entities = sorted({ent["word"] for ent in ner_results if ent["score"] > 0.6})

    # Subjectivity & Readability Analysis
    subjectivity_score = TextBlob(safe_text).sentiment.subjectivity
    reading_ease = textstat.flesch_reading_ease(safe_text)

    return {
        "sentiment_score": sentiment_score,
        "subjectivity_score": subjectivity_score,
        "reading_ease": reading_ease,
        "primary_tone": primary_tone,
        "tone_scores": tone_scores,
        "keywords": extracted_keywords,
        "entities": extracted_entities,
    }
|
| 101 |
|
| 102 |
|
|
|
|
| 112 |
"axis": {"range": [-1, 1], "tickwidth": 1},
|
| 113 |
"bar": {"color": "darkblue"},
|
| 114 |
"steps": [
|
| 115 |
+
{"range": [-1, -0.2], "color": "#ffb3b3"},
|
| 116 |
+
{"range": [-0.2, 0.2], "color": "#f2f2f2"},
|
| 117 |
+
{"range": [0.2, 1], "color": "#b3ffb3"},
|
| 118 |
],
|
| 119 |
},
|
| 120 |
)
|
|
|
|
| 123 |
return fig
|
| 124 |
|
| 125 |
|
| 126 |
+
def _create_comparison_radar_chart(results_a: dict, results_b: dict) -> go.Figure:
    """Generates an overlapping radar chart to compare emotions.

    Args:
        results_a: Analysis dict for source A; must contain "tone_scores".
        results_b: Analysis dict for source B; must contain "tone_scores".

    Returns:
        A plotly Figure with one filled Scatterpolar trace per source.
    """
    # FIX: sort the union of emotion labels so the axis order is stable across
    # reruns — building from a bare set gave an arbitrary order that reshuffled
    # the radar axes on every render.
    categories = sorted(set(results_a["tone_scores"]) | set(results_b["tone_scores"]))

    fig = go.Figure()
    if not categories:
        # Defensive: with no emotions to plot, categories[0] below would raise
        # IndexError; return an empty figure instead.
        return fig

    val_a = [results_a["tone_scores"].get(c, 0) for c in categories]
    val_b = [results_b["tone_scores"].get(c, 0) for c in categories]

    # Close the radar loop by repeating the first point at the end.
    categories.append(categories[0])
    val_a.append(val_a[0])
    val_b.append(val_b[0])

    fig.add_trace(go.Scatterpolar(
        r=val_a, theta=categories, fill='toself', name='Source A', line_color='#4f46e5'
    ))
    fig.add_trace(go.Scatterpolar(
        r=val_b, theta=categories, fill='toself', name='Source B', line_color='#10b981'
    ))
    fig.update_layout(
        polar=dict(radialaxis=dict(visible=True, range=[0, 1])),
        showlegend=True,
        title={"text": "Relative Emotion Profile", "font": {"size": 18}},
        height=450,
        margin=dict(l=40, r=40, t=60, b=40),
    )
    return fig
|
| 154 |
|
|
|
|
| 178 |
st.markdown("##### Media bias and framing effects across global news sources.")
|
| 179 |
st.divider()
|
| 180 |
|
| 181 |
+
# Warm the model cache up front so the first button click isn't slow.
with st.spinner("Starting NLP models."):
    _load_nlp_models()

col1, col2 = st.columns(2)

with col1:
    user_article_a = st.text_area("Data Source A", value=ARTICLE_A.strip(), height=220)

with col2:
    user_article_b = st.text_area("Data Source B", value=ARTICLE_B.strip(), height=220)

st.write("")

# Single unified execution button
if st.button("Analyze & Compare Sources", use_container_width=True, type="primary"):
    with st.spinner("Analyzing framing semantics for both sources."):
        # Results live in session_state so they survive Streamlit reruns.
        st.session_state.results_a = analyze_article(user_article_a)
        st.session_state.results_b = analyze_article(user_article_b)

# Analysis Display
# NOTE(review): assumes results_a/results_b are initialized (e.g. to None)
# earlier in the file before first access — confirm against the full source.
if st.session_state.results_a and st.session_state.results_b:
    st.divider()
    st.markdown("### Framing Analytics & Comparison")

    # Radar Chart spans the top
    st.plotly_chart(_create_comparison_radar_chart(st.session_state.results_a, st.session_state.results_b), use_container_width=True)

    res_col1, res_col2 = st.columns(2)

    # Render Column A
    with res_col1:
        r_a = st.session_state.results_a
        st.markdown("#### Source A Breakdown")
        m1, m2, m3 = st.columns(3)
        m1.metric("Subjectivity", f"{r_a['subjectivity_score']:.2f}")
        m2.metric("Primary Emotion", r_a['primary_tone'].title())
        m3.metric("Reading Ease", f"{r_a['reading_ease']:.1f}")

        st.plotly_chart(_create_sentiment_gauge(r_a["sentiment_score"], "Sentiment Bias"), use_container_width=True)

        if r_a["entities"]:
            st.markdown(f"**Extracted Entities:** `{', '.join(r_a['entities'])}`")

        st.markdown("**Key Framing Language:**")
        # _highlight_keywords is defined elsewhere in this file; it wraps the
        # detected keyphrases in highlight markup for the HTML box below.
        annotated_text = _highlight_keywords(user_article_a, r_a["keywords"])
        st.markdown(f"<div style='background-color: #f8fafc; padding: 1rem; border-radius: 8px; border: 1px solid #e2e8f0;'>{annotated_text}</div>", unsafe_allow_html=True)

    # Render Column B
    with res_col2:
        r_b = st.session_state.results_b
        st.markdown("#### Source B Breakdown")
        m1, m2, m3 = st.columns(3)
        m1.metric("Subjectivity", f"{r_b['subjectivity_score']:.2f}")
        m2.metric("Primary Emotion", r_b['primary_tone'].title())
        m3.metric("Reading Ease", f"{r_b['reading_ease']:.1f}")

        st.plotly_chart(_create_sentiment_gauge(r_b["sentiment_score"], "Sentiment Bias"), use_container_width=True)

        if r_b["entities"]:
            st.markdown(f"**Extracted Entities:** `{', '.join(r_b['entities'])}`")

        st.markdown("**Key Framing Language:**")
        annotated_text = _highlight_keywords(user_article_b, r_b["keywords"])
        st.markdown(f"<div style='background-color: #f8fafc; padding: 1rem; border-radius: 8px; border: 1px solid #e2e8f0;'>{annotated_text}</div>", unsafe_allow_html=True)
|