Spaces:

Kurkur99
/

Sentiment_analysis

Runtime error

Kurkur99 committed on Sep 2, 2023

Commit

0bd7d7b

1 Parent(s): a0e0a21

Update eda.py

Files changed (1) hide show

eda.py CHANGED Viewed

@@ -21,14 +21,6 @@ def process_review(review):
     review = re.sub(r'[^a-z\s]', '', review) # Remove non-alphabetical characters
     return review
-def find_review_column(data):
-    """Attempt to identify the review column from the dataset."""
-    potential_columns = ['review', 'text', 'comment', 'message', 'description']
-    for col in potential_columns:
-        if col in data.columns:
-            return col
-    return None
 def display_eda(data):
     # Derive the 'sentiment' column from 'rating' if it doesn't exist
     if 'sentiment' not in data.columns:
@@ -50,16 +42,11 @@ def display_eda(data):
     # Word cloud for each sentiment
     st.subheader("Word Clouds for Sentiments")
-    review_column = find_review_column(data)
-    if not review_column:
-        st.error("Couldn't find a column with reviews. Please check the dataset.")
-        return
     sentiments = data['sentiment'].unique()
     for sentiment in sentiments:
         st.write(f"Word Cloud for {sentiment}")
         subset = data[data['sentiment'] == sentiment]
-        text = " ".join(process_review(review) for review in subset[review_column])
         wordcloud = WordCloud(max_words=100, background_color="white").generate(text)
         plt.figure()
         plt.imshow(wordcloud, interpolation="bilinear")

     review = re.sub(r'[^a-z\s]', '', review) # Remove non-alphabetical characters
     return review
 def display_eda(data):
     # Derive the 'sentiment' column from 'rating' if it doesn't exist
     if 'sentiment' not in data.columns:
     # Word cloud for each sentiment
     st.subheader("Word Clouds for Sentiments")
     sentiments = data['sentiment'].unique()
     for sentiment in sentiments:
         st.write(f"Word Cloud for {sentiment}")
         subset = data[data['sentiment'] == sentiment]
+        text = " ".join(process_review(review) for review in subset['review_description'])
         wordcloud = WordCloud(max_words=100, background_color="white").generate(text)
         plt.figure()
         plt.imshow(wordcloud, interpolation="bilinear")