Spaces:

SantanuBanerjee
/

TaxDirection

Sleeping

App Files Files Community

SantanuBanerjee committed on Aug 7, 2024

Commit

6ec568e

verified ·

1 Parent(s): 6682e9f

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -13

app.py CHANGED Viewed

@@ -584,8 +584,8 @@ def nlp_pipeline(original_df):
     print("Clustering Done...")
     # return processed_df, budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters
-    print("\n location_clusters_1: ", location_clusters)
-    print("\n problem_clusters_1: ", problem_clusters)
     # # Generate project proposals
     # location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
     # problem_clusters = dict(enumerate(processed_df['Problem_Category_Words'].unique()))
@@ -698,20 +698,35 @@ def process_excel(file):
                 consoleMessage_and_Print("Error during Project Proposal excelling at the end")
-            # Ensure location_clusters and problem_clusters are in DataFrame format
-            if isinstance(location_clusters, pd.DataFrame):
-                location_clusters.to_excel(writer, sheet_name='Location_Clusters', index=False)
-            else:
-                consoleMessage_and_Print("Converting Location Clusters to df")
-                pd.DataFrame(location_clusters).to_excel(writer, sheet_name='Location_Clusters', index=False)
-            if isinstance(problem_clusters, pd.DataFrame):
-                problem_clusters.to_excel(writer, sheet_name='Problem_Clusters', index=False)
-            else:
-                consoleMessage_and_Print("Converting Problem Clusters to df")
-                pd.DataFrame(problem_clusters).to_excel(writer, sheet_name='Problem_Clusters', index=False)

     print("Clustering Done...")
     # return processed_df, budget_cluster_df, problem_cluster_df, location_clusters, problem_clusters
+    print("\n location_clusters: ", location_clusters)
+    print("\n problem_clusters: ", problem_clusters)
     # # Generate project proposals
     # location_clusters = dict(enumerate(processed_df['Location_Category_Words'].unique()))
     # problem_clusters = dict(enumerate(processed_df['Problem_Category_Words'].unique()))
                 consoleMessage_and_Print("Error during Project Proposal excelling at the end")
+            try:
+                location_clusters_df = pd.DataFrame({'Cluster_Id': list(location_clusters.keys()),
+                                                     'Location_Cluster': list(location_clusters.values())})
+                location_clusters_df.to_excel(writer, sheet_name='Location_Clusters', index=False)
+            except error:
+                consoleMessage_and_Print("Error during Location Cluster Dataframing")
+            try:
+                problem_clusters_df = pd.DataFrame({'Cluster_Id': list(location_clusters.keys()),
+                                                    'Problem_Cluster': list(location_clusters.values())})
+                problem_clusters_df.to_excel(writer, sheet_name='Problem_Clusters', index=False)
+            except error:
+                consoleMessage_and_Print("Error during Problem Cluster Dataframing")
+            # # Ensure location_clusters and problem_clusters are in DataFrame format
+            # if isinstance(location_clusters, pd.DataFrame):
+            #     location_clusters.to_excel(writer, sheet_name='Location_Clusters', index=False)
+            # else:
+            #     consoleMessage_and_Print("Converting Location Clusters to df")
+            #     pd.DataFrame(location_clusters).to_excel(writer, sheet_name='Location_Clusters', index=False)
+            # if isinstance(problem_clusters, pd.DataFrame):
+            #     problem_clusters.to_excel(writer, sheet_name='Problem_Clusters', index=False)
+            # else:
+            #     consoleMessage_and_Print("Converting Problem Clusters to df")
+            #     pd.DataFrame(problem_clusters).to_excel(writer, sheet_name='Problem_Clusters', index=False)