Spaces:

Tanmoy-AI
/

customer-connect

Sleeping

App Files Files Community

FarhinSadia committed on Jun 20, 2025

Commit

47dd793

1 Parent(s): 3b875a3

fixed the sentiment analysis

Browse files

Files changed (1) hide show

src/data_processor.py +10 -4

src/data_processor.py CHANGED Viewed

@@ -5,7 +5,7 @@ import re
 from textblob import TextBlob
 import numpy as np
 import json
-import streamlit as st
 try:
     import openai
@@ -25,7 +25,6 @@ class DataProcessor:
     def __init__(self, openai_api_key=None):
         self.processed_data = None
         if NLTK_AVAILABLE:
             try:
                 self.sia = SentimentIntensityAnalyzer()
@@ -34,7 +33,6 @@ class DataProcessor:
         else:
             self.sia = None
         self.use_gpt = False
         if openai_api_key and OPENAI_AVAILABLE:
             openai.api_key = openai_api_key
@@ -186,7 +184,7 @@ class DataProcessor:
         text_lower = str(text).lower()
-        if '?' in text_lower or any(phrase in text_lower for phrase in ['how do', 'what is', 'when', 'where', 'can i', 'could you']):
             return 'Inquiry', 'Contains questions or information seeking'
         elif any(word in text_lower for word in ['complaint', 'problem', 'issue', 'error', 'failed', 'not working', 'terrible', 'worst']):
             return 'Complaint', 'Contains complaint or problem description'
@@ -223,6 +221,14 @@ class DataProcessor:
         df[['emotion', 'emotion_keywords']] = df['text'].apply(lambda x: pd.Series(self.detect_emotion(x)))
         df[['category', 'category_reason']] = df['text'].apply(lambda x: pd.Series(self.categorize_post(x)))
         df['viral_score'] = 0
         if 'likes' in df.columns:
             df['viral_score'] += df['likes'].fillna(0)

 from textblob import TextBlob
 import numpy as np
 import json
+import streamlit as st
 try:
     import openai
     def __init__(self, openai_api_key=None):
         self.processed_data = None
         if NLTK_AVAILABLE:
             try:
                 self.sia = SentimentIntensityAnalyzer()
         else:
             self.sia = None
         self.use_gpt = False
         if openai_api_key and OPENAI_AVAILABLE:
             openai.api_key = openai_api_key
         text_lower = str(text).lower()
+        if '?' in text_lower or any(phrase in text_lower for phrase in ['how do', 'what is', 'when', 'where', 'can i', 'could you', 'explain']):
             return 'Inquiry', 'Contains questions or information seeking'
         elif any(word in text_lower for word in ['complaint', 'problem', 'issue', 'error', 'failed', 'not working', 'terrible', 'worst']):
             return 'Complaint', 'Contains complaint or problem description'
         df[['emotion', 'emotion_keywords']] = df['text'].apply(lambda x: pd.Series(self.detect_emotion(x)))
         df[['category', 'category_reason']] = df['text'].apply(lambda x: pd.Series(self.categorize_post(x)))
+        # --- START OF FIX ---
+        # This is the new, crucial part.
+        # It corrects the sentiment for any post that was categorized as an 'Inquiry'.
+        # This fixes the issue where questions were incorrectly marked as 'Positive'.
+        df.loc[df['category'] == 'Inquiry', 'sentiment'] = 'Neutral'
+        df.loc[df['category'] == 'Inquiry', 'polarity'] = 0.0
+        # --- END OF FIX ---
         df['viral_score'] = 0
         if 'likes' in df.columns:
             df['viral_score'] += df['likes'].fillna(0)