tanish78 committed on
Commit
3594f61
·
verified ·
1 Parent(s): d14f22e

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -1
app.py CHANGED
@@ -173,17 +173,22 @@ def main(file, num_categories_to_display):
173
  category_sizes = df['Category'].value_counts().reset_index()
174
  category_sizes.columns = ['Category', 'Count']
175
  sorted_categories = category_sizes.sort_values(by='Count', ascending=False)['Category'].tolist()
 
 
176
 
177
  # Get the largest x categories as specified by num_categories_to_display
178
  largest_categories = sorted_categories[:num_categories_to_display]
 
179
 
180
  # Filter the dataframe to include only the largest categories
181
  filtered_df = df[df['Category'].isin(largest_categories)]
 
182
 
183
  # Sort the dataframe by Category
184
  filtered_df = filtered_df.sort_values(by='Category')
 
185
 
186
- wordcloud_img = generate_wordcloud(filtered_df) # Word cloud based on the entire dataframe
187
  bar_chart_img = generate_bar_chart(df, num_categories_to_display) # Bar chart based on the filtered dataframe
188
 
189
  with tempfile.NamedTemporaryFile(delete=False, suffix=".csv") as tmpfile:
 
173
  category_sizes = df['Category'].value_counts().reset_index()
174
  category_sizes.columns = ['Category', 'Count']
175
  sorted_categories = category_sizes.sort_values(by='Count', ascending=False)['Category'].tolist()
176
+ sorted_categories_sm = category_sizes.sort_values(by='Count', ascending=False)['Category'].tolist()
177
+
178
 
179
  # Get the largest x categories as specified by num_categories_to_display
180
  largest_categories = sorted_categories[:num_categories_to_display]
181
+ smallest_categories = sorted_categories_sm[:num_categories_to_display]
182
 
183
  # Filter the dataframe to include only the largest categories
184
  filtered_df = df[df['Category'].isin(largest_categories)]
185
+ filtered_cloud_df = df[df['Category'].isin(smallest_categories)]
186
 
187
  # Sort the dataframe by Category
188
  filtered_df = filtered_df.sort_values(by='Category')
189
+ filtered_cloud_df = filtered_cloud_df.sort_values(by='Category')
190
 
191
+ wordcloud_img = generate_wordcloud(filtered_cloud_df) # Word cloud based on the entire dataframe
192
  bar_chart_img = generate_bar_chart(df, num_categories_to_display) # Bar chart based on the filtered dataframe
193
 
194
  with tempfile.NamedTemporaryFile(delete=False, suffix=".csv") as tmpfile: