Spaces:

ai-sentiment-group
/

BootcampFinalProject

Sleeping

App Files Community

alexoh2020 committed on Aug 25, 2025

Commit

0f2373c

1 Parent(s): 097fe34

added VADER sentiment analysis

Browse files

Files changed (5) hide show

.gitignore +2 -0
config.json +4 -0
requirements.txt +2 -1
src/api_handler.py +29 -35
src/streamlit_app.py +16 -10

.gitignore CHANGED Viewed

@@ -10,6 +10,8 @@ __pycache__/
 # Virtual environment
 .venv/
 venv/
 # IDE
 .vscode/

 # Virtual environment
 .venv/
 venv/
+.env/
+env/
 # IDE
 .vscode/

config.json CHANGED Viewed

@@ -28,5 +28,9 @@
     "AI breakthrough promises to revolutionize healthcare",
     "Concerns grow over AI job displacement",
     "New machine learning model shows mixed results"
   ]
 }

     "AI breakthrough promises to revolutionize healthcare",
     "Concerns grow over AI job displacement",
     "New machine learning model shows mixed results"
+  ],
+  "model_options":[
+    "Vader",
+    "TextBlob"
   ]
 }

requirements.txt CHANGED Viewed

@@ -4,4 +4,5 @@ requests>=2.31.0
 python-dotenv>=1.0.0
 textblob>=0.17.1
 plotly>=5.15.0
-numpy>=1.24.0

 python-dotenv>=1.0.0
 textblob>=0.17.1
 plotly>=5.15.0
+numpy>=1.24.0
+vaderSentiment>=3.3.2

src/api_handler.py CHANGED Viewed

@@ -10,6 +10,8 @@ import json
 from dotenv import load_dotenv
 from textblob import TextBlob
 from typing import List, Dict, Optional
 # Load environment variables
 load_dotenv()
@@ -77,7 +79,7 @@ class AINewsAnalyzer:
             print(f"Request failed: {e}")
             return []
-    def analyze_sentiment(self, text: str) -> Dict:
         """
         Analyze sentiment of given text using TextBlob
@@ -94,30 +96,39 @@ class AINewsAnalyzer:
                 'label': 'neutral',
                 'confidence': 0.0
             }
         blob = TextBlob(text)
-        polarity = blob.sentiment.polarity
         subjectivity = blob.sentiment.subjectivity
-        # Determine sentiment label
-        if polarity > 0.1:
             label = 'positive'
-        elif polarity < -0.1:
             label = 'negative'
         else:
             label = 'neutral'
         # Calculate confidence (distance from neutral)
         confidence = abs(polarity)
-        return {
             'polarity': polarity,
             'subjectivity': subjectivity,
             'label': label,
             'confidence': confidence
         }
-    def process_news_articles(self, articles: List[Dict]) -> pd.DataFrame:
         """
         Process news articles and add sentiment analysis
@@ -135,15 +146,14 @@ class AINewsAnalyzer:
                 continue
             # Analyze sentiment of title and description
-            title_sentiment = self.analyze_sentiment(article['title'])
-            description_sentiment = self.analyze_sentiment(article.get('description', ''))
             # Combine title and description sentiment (weighted toward title)
             combined_polarity = (title_sentiment['polarity'] * 0.7 +
                                description_sentiment['polarity'] * 0.3)
             combined_subjectivity = (title_sentiment['subjectivity'] * 0.7 +
                                    description_sentiment['subjectivity'] * 0.3)
             # Determine overall sentiment
             if combined_polarity > 0.1:
                 overall_sentiment = 'positive'
@@ -183,7 +193,8 @@ class AINewsAnalyzer:
     def get_ai_news_with_sentiment(self,
                                    query: str = "artificial intelligence",
                                    days: int = 7,
-                                   sources: Optional[str] = None) -> pd.DataFrame:
         """
         Complete pipeline: fetch news and analyze sentiment
@@ -207,26 +218,10 @@ class AINewsAnalyzer:
         print(f"Found {len(articles)} articles. Analyzing sentiment...")
         # Process and analyze
-        df = self.process_news_articles(articles)
-        print(f"Processed {len(df)} articles with sentiment analysis.")
         return df
-def fetch_ai_news(query="artificial intelligence", days=7, sources=None):
-    """Standalone function to fetch AI news"""
-    analyzer = AINewsAnalyzer()
-    return analyzer.fetch_ai_news(query, days, sources=sources)
-def analyze_sentiment(text):
-    """Standalone function to analyze sentiment"""
-    analyzer = AINewsAnalyzer()
-    return analyzer.analyze_sentiment(text)
-def get_ai_news_with_sentiment(query="artificial intelligence", days=7, sources=None):
-    """Standalone function for complete pipeline"""
-    analyzer = AINewsAnalyzer()
-    return analyzer.get_ai_news_with_sentiment(query, days, sources)
 def load_config():
     """Load configuration from config.json"""
     with open('config.json', 'r') as f:
@@ -247,8 +242,7 @@ if __name__ == "__main__":
     for text in test_texts:
         sentiment = analyzer.analyze_sentiment(text)
         print(f"Text: {text}")
-        print(f"Sentiment: {sentiment['label']} (polarity: {sentiment['polarity']:.2f})")
-        print()
     # Test news fetching
     print("Fetching recent AI news...")

 from dotenv import load_dotenv
 from textblob import TextBlob
 from typing import List, Dict, Optional
+from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer as SIA
 # Load environment variables
 load_dotenv()
             print(f"Request failed: {e}")
             return []
+    def analyze_sentiment(self, text: str, model: str) -> Dict:
         """
         Analyze sentiment of given text using TextBlob
                 'label': 'neutral',
                 'confidence': 0.0
             }
         blob = TextBlob(text)
         subjectivity = blob.sentiment.subjectivity
+        # implement Vader Analysis for polarity scores
+        if model == "Vader":
+            vader = SIA()
+            fullpolarity = vader.polarity_scores(text)
+            polarity=fullpolarity['compound']
+            polarity_thresh = 0.05
+        # otherwise
+        else:
+            polarity = blob.sentiment.polarity
+            polarity_thresh = 0.1
+        # Determine sentiment label through polarity threshold
+        if polarity > polarity_thresh:
             label = 'positive'
+        elif polarity < -polarity_thresh:
             label = 'negative'
         else:
             label = 'neutral'
         # Calculate confidence (distance from neutral)
         confidence = abs(polarity)
+        res = {
             'polarity': polarity,
             'subjectivity': subjectivity,
             'label': label,
             'confidence': confidence
         }
+        return res
+    def process_news_articles(self, articles: List[Dict], model: str) -> pd.DataFrame:
         """
         Process news articles and add sentiment analysis
                 continue
             # Analyze sentiment of title and description
+            title_sentiment = self.analyze_sentiment(article['title'], model=model)
+            description_sentiment = self.analyze_sentiment(article['description'], model=model)
             # Combine title and description sentiment (weighted toward title)
             combined_polarity = (title_sentiment['polarity'] * 0.7 +
                                description_sentiment['polarity'] * 0.3)
             combined_subjectivity = (title_sentiment['subjectivity'] * 0.7 +
                                    description_sentiment['subjectivity'] * 0.3)
             # Determine overall sentiment
             if combined_polarity > 0.1:
                 overall_sentiment = 'positive'
     def get_ai_news_with_sentiment(self,
                                    query: str = "artificial intelligence",
                                    days: int = 7,
+                                   sources: Optional[str] = None,
+                                   model: str = "Textblob") -> pd.DataFrame:
         """
         Complete pipeline: fetch news and analyze sentiment
         print(f"Found {len(articles)} articles. Analyzing sentiment...")
         # Process and analyze
+        df = self.process_news_articles(articles, model=model)
+        print(f"Processed {len(df)} articles with sentiment analysis. \nUsed {model} for polarity analysis and Textblob for sentiment analysis.")
         return df
 def load_config():
     """Load configuration from config.json"""
     with open('config.json', 'r') as f:
     for text in test_texts:
         sentiment = analyzer.analyze_sentiment(text)
         print(f"Text: {text}")
+        print(f"Sentiment: {sentiment['label']} (polarity: {sentiment['polarity']:.2f}\n")
     # Test news fetching
     print("Fetching recent AI news...")

src/streamlit_app.py CHANGED Viewed

@@ -19,7 +19,7 @@ st.set_page_config(
 # Custom CSS for better styling
 st.markdown("""
-<style>
     .main-header {
         font-size: 2.5rem;
         font-weight: bold;
@@ -46,11 +46,11 @@ def load_config():
         return json.load(f)
 @st.cache_data(ttl=1800)  # Cache for 30 minutes
-def load_news_data(query, days, sources=None):
     """Load and cache news data"""
     try:
         analyzer = AINewsAnalyzer()
-        df = analyzer.get_ai_news_with_sentiment(query=query, days=days, sources=sources)
         return df, None
     except Exception as e:
         return pd.DataFrame(), str(e)
@@ -105,7 +105,7 @@ def create_source_analysis(df):
     return fig
-def create_polarity_distribution(df):
     """Create sentiment polarity distribution"""
     if df.empty:
         return None
@@ -119,10 +119,9 @@ def create_polarity_distribution(df):
     )
     # Add vertical lines for sentiment boundaries
-    fig.add_vline(x=0.1, line_dash="dash", line_color="green", annotation_text="Positive Threshold")
-    fig.add_vline(x=-0.1, line_dash="dash", line_color="red", annotation_text="Negative Threshold")
-    fig.add_vline(x=0, line_dash="dash", line_color="gray", annotation_text="Neutral")
     return fig
@@ -150,6 +149,12 @@ def main():
         "Or enter custom search:",
         placeholder="e.g., 'generative AI'"
     )
     # Use custom query if provided
     final_query = custom_query if custom_query else selected_query
@@ -186,7 +191,7 @@ def main():
     # Load data
     if st.sidebar.button("🚀 Analyze News", type="primary"):
         with st.spinner(f"Fetching and analyzing news about '{final_query}'..."):
-            df, error = load_news_data(final_query, days, sources)
             if error:
                 st.error(f"Error loading data: {error}")
@@ -242,7 +247,8 @@ def main():
                 st.plotly_chart(source_fig, use_container_width=True)
         # Row 2: Polarity distribution (full width)
-        polarity_fig = create_polarity_distribution(df)
         if polarity_fig:
             st.plotly_chart(polarity_fig, use_container_width=True)

 # Custom CSS for better styling
 st.markdown("""
+<style>
     .main-header {
         font-size: 2.5rem;
         font-weight: bold;
         return json.load(f)
 @st.cache_data(ttl=1800)  # Cache for 30 minutes
+def load_news_data(query, days, sources=None, model="TextBlob"):
     """Load and cache news data"""
     try:
         analyzer = AINewsAnalyzer()
+        df = analyzer.get_ai_news_with_sentiment(query=query, days=days, sources=sources, model=model)
         return df, None
     except Exception as e:
         return pd.DataFrame(), str(e)
     return fig
+def create_polarity_distribution(df, thresh: float):
     """Create sentiment polarity distribution"""
     if df.empty:
         return None
     )
     # Add vertical lines for sentiment boundaries
+    fig.add_vline(x=thresh, line_dash="dash", line_color="green", annotation_text="Positive Threshold", annotation_position="top right")
+    fig.add_vline(x=-thresh, line_dash="dash", line_color="red", annotation_text="Negative Threshold", annotation_position="top left")
+    fig.add_vline(x=0, line_dash="dash", line_color="gray", annotation_text="Neutral", annotation_position="top")
     return fig
         "Or enter custom search:",
         placeholder="e.g., 'generative AI'"
     )
+    model_query = st.sidebar.selectbox(
+        "📝 Search a Sentiment Model:",
+        options=config["model_options"],
+        index=0
+    )
     # Use custom query if provided
     final_query = custom_query if custom_query else selected_query
     # Load data
     if st.sidebar.button("🚀 Analyze News", type="primary"):
         with st.spinner(f"Fetching and analyzing news about '{final_query}'..."):
+            df, error = load_news_data(final_query, days, sources=sources, model=model_query)
             if error:
                 st.error(f"Error loading data: {error}")
                 st.plotly_chart(source_fig, use_container_width=True)
         # Row 2: Polarity distribution (full width)
+        thresh = 0.05 if model_query == "Vader" else 0.1
+        polarity_fig = create_polarity_distribution(df, thresh=thresh)
         if polarity_fig:
             st.plotly_chart(polarity_fig, use_container_width=True)