Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -458,17 +458,17 @@ def nlp_pipeline(original_df):
|
|
| 458 |
|
| 459 |
|
| 460 |
|
| 461 |
-
|
| 462 |
-
# Create cluster dataframes
|
| 463 |
-
budget_cluster_df, problem_cluster_df = create_cluster_dataframes(processed_df)
|
| 464 |
|
| 465 |
-
# # Generate project proposals
|
| 466 |
-
# location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
|
| 467 |
-
# problem_clusters = dict(enumerate(processed_df['Problem_Category_Words'].unique()))
|
| 468 |
-
project_proposals = create_project_proposals(budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters)
|
| 469 |
|
| 470 |
-
console_messages.append("NLP pipeline completed.")
|
| 471 |
-
return processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters
|
| 472 |
|
| 473 |
|
| 474 |
|
|
@@ -488,7 +488,8 @@ def process_excel(file):
|
|
| 488 |
try:
|
| 489 |
# Process the DataFrame
|
| 490 |
console_messages.append("Processing the DataFrame...")
|
| 491 |
-
processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters = nlp_pipeline(df)
|
|
|
|
| 492 |
|
| 493 |
output_filename = "OutPut_PPs.xlsx"
|
| 494 |
with pd.ExcelWriter(output_filename) as writer:
|
|
|
|
| 458 |
|
| 459 |
|
| 460 |
|
| 461 |
+
return processed_df
|
| 462 |
+
# # Create cluster dataframes
|
| 463 |
+
# budget_cluster_df, problem_cluster_df = create_cluster_dataframes(processed_df)
|
| 464 |
|
| 465 |
+
# # # Generate project proposals
|
| 466 |
+
# # location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
|
| 467 |
+
# # problem_clusters = dict(enumerate(processed_df['Problem_Category_Words'].unique()))
|
| 468 |
+
# project_proposals = create_project_proposals(budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters)
|
| 469 |
|
| 470 |
+
# console_messages.append("NLP pipeline completed.")
|
| 471 |
+
# return processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters
|
| 472 |
|
| 473 |
|
| 474 |
|
|
|
|
| 488 |
try:
|
| 489 |
# Process the DataFrame
|
| 490 |
console_messages.append("Processing the DataFrame...")
|
| 491 |
+
# processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters = nlp_pipeline(df)
|
| 492 |
+
processed_df = nlp_pipeline(df)
|
| 493 |
|
| 494 |
output_filename = "OutPut_PPs.xlsx"
|
| 495 |
with pd.ExcelWriter(output_filename) as writer:
|