tanish78 committed on
Commit
d32c31b
·
verified ·
1 Parent(s): 2d8cb02

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -173,18 +173,22 @@ def main(file, num_clusters_to_display):
173
  category_sizes = df['Category'].value_counts().reset_index()
174
  category_sizes.columns = ['Category', 'Count']
175
  sorted_categories = category_sizes.sort_values(by='Count', ascending=True)['Category'].tolist()
 
176
 
177
  # Get the largest x categories as specified by num_clusters_to_display
178
  largest_categories = sorted_categories[:num_clusters_to_display]
 
179
 
180
  # Filter the dataframe to include only the largest categories
181
  filtered_df = df[df['Category'].isin(largest_categories)]
 
182
 
183
  # Sort the dataframe by Category
184
  filtered_df = filtered_df.sort_values(by='Category')
 
185
 
186
- wordcloud_img = generate_wordcloud(filtered_df)
187
- bar_chart_img = generate_bar_chart(filtered_df, num_clusters_to_display)
188
 
189
  with tempfile.NamedTemporaryFile(delete=False, suffix=".csv") as tmpfile:
190
  filtered_df.to_csv(tmpfile.name, index=False)
 
173
  category_sizes = df['Category'].value_counts().reset_index()
174
  category_sizes.columns = ['Category', 'Count']
175
  sorted_categories = category_sizes.sort_values(by='Count', ascending=True)['Category'].tolist()
176
+ sorted_categories_sm = category_sizes.sort_values(by='Count', ascending=False)['Category'].tolist()
177
 
178
  # Get the largest x categories as specified by num_clusters_to_display
179
  largest_categories = sorted_categories[:num_clusters_to_display]
180
+ smallest_categories = sorted_categories_sm[:num_clusters_to_display]
181
 
182
  # Filter the dataframe to include only the largest categories
183
  filtered_df = df[df['Category'].isin(largest_categories)]
184
+ filtered_cloud_df = df[df['Category'].isin(smallest_categories)]
185
 
186
  # Sort the dataframe by Category
187
  filtered_df = filtered_df.sort_values(by='Category')
188
+ filtered_cloud_df = filtered_cloud_df.sort_values(by='Category')
189
 
190
+ wordcloud_img = generate_wordcloud(filtered_cloud_df)
191
+ bar_chart_img = generate_bar_chart(df, num_clusters_to_display)
192
 
193
  with tempfile.NamedTemporaryFile(delete=False, suffix=".csv") as tmpfile:
194
  filtered_df.to_csv(tmpfile.name, index=False)