Spaces:

SantanuBanerjee
/

TaxDirection

Sleeping

App Files Community

SantanuBanerjee committed on Aug 6, 2024

Commit

f80d2db

verified ·

1 Parent(s): 2fbc9fe

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -3

app.py CHANGED Viewed

@@ -462,7 +462,7 @@ def nlp_pipeline(original_df):
     # Create cluster dataframes
     budget_cluster_df, problem_cluster_df = create_cluster_dataframes(processed_df)
-    return processed_df, budget_cluster_df
     # # # Generate project proposals
     # # location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
@@ -491,7 +491,7 @@ def process_excel(file):
         # Process the DataFrame
         console_messages.append("Processing the DataFrame...")
         # processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters = nlp_pipeline(df)
-        processed_df , budget_cluster_df = nlp_pipeline(df)
         output_filename = "OutPut_PPs.xlsx"
         with pd.ExcelWriter(output_filename) as writer:
@@ -502,9 +502,23 @@ def process_excel(file):
             # project_proposals_df.to_excel(writer, sheet_name='Project_Proposals', index=False)
             budget_cluster_df.to_excel(writer, sheet_name='Financial_Weights')
-            # problem_cluster_df.to_excel(writer, sheet_name='Problem_Descriptions')
             processed_df.to_excel(writer, sheet_name='Input_Processed', index=False)
         console_messages.append("Processing completed. Ready for download.")
         return output_filename, "\n".join(console_messages)  # Return the processed DataFrame as Excel file

     # Create cluster dataframes
     budget_cluster_df, problem_cluster_df = create_cluster_dataframes(processed_df)
+    return processed_df, budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters
     # # # Generate project proposals
     # # location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
         # Process the DataFrame
         console_messages.append("Processing the DataFrame...")
         # processed_df, budget_cluster_df, problem_cluster_df, project_proposals, location_clusters, problem_clusters = nlp_pipeline(df)
+        processed_df, budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters  = nlp_pipeline(df)
         output_filename = "OutPut_PPs.xlsx"
         with pd.ExcelWriter(output_filename) as writer:
             # project_proposals_df.to_excel(writer, sheet_name='Project_Proposals', index=False)
             budget_cluster_df.to_excel(writer, sheet_name='Financial_Weights')
+            problem_cluster_df.to_excel(writer, sheet_name='Problem_Descriptions')
             processed_df.to_excel(writer, sheet_name='Input_Processed', index=False)
+            # Ensure location_clusters and problem_clusters are in DataFrame format
+            if isinstance(location_clusters, pd.DataFrame):
+                location_clusters.to_excel(writer, sheet_name='Location_Clusters', index=False)
+            else:
+                console_messages.append("Converting Location Clusters to df")
+                pd.DataFrame(location_clusters).to_excel(writer, sheet_name='Location_Clusters', index=False)
+            if isinstance(problem_clusters, pd.DataFrame):
+                problem_clusters.to_excel(writer, sheet_name='Problem_Clusters', index=False)
+            else:
+                console_messages.append("Converting Problem Clusters to df")
+                pd.DataFrame(problem_clusters).to_excel(writer, sheet_name='Problem_Clusters', index=False)
         console_messages.append("Processing completed. Ready for download.")
         return output_filename, "\n".join(console_messages)  # Return the processed DataFrame as Excel file