Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -342,31 +342,32 @@ def nlp_pipeline(original_df, console_messages):
|
|
| 342 |
print(f"Optimal clusters: {optimal_clusters}")
|
| 343 |
print(result_df.head())
|
| 344 |
# console_messages.append(f"Optimal clusters: {optimal_n_clusters}")
|
|
|
|
|
|
|
|
|
|
| 345 |
except Exception as e:
|
| 346 |
-
print(f"Error in extract_problem_domains: {e}")
|
| 347 |
-
|
|
|
|
|
|
|
| 348 |
|
| 349 |
|
| 350 |
# problem_clusters, problem_model = perform_clustering(processed_df['Problem_Description'], n_clusters=10)
|
| 351 |
# location_clusters, location_model = perform_clustering(processed_df['Geographical_Location'], n_clusters=5)
|
| 352 |
|
| 353 |
|
| 354 |
-
|
| 355 |
-
# return processed_df
|
| 356 |
-
return domain_df, console_messages
|
| 357 |
|
| 358 |
|
| 359 |
def process_excel(file):
|
| 360 |
console_messages = []
|
| 361 |
-
console_messages.append("Processing starts...")
|
| 362 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 363 |
try:
|
| 364 |
-
# Ensure the file path is correct
|
| 365 |
-
console_messages.append("Reading the uploaded Excel file...")
|
| 366 |
-
file_path = file.name if hasattr(file, 'name') else file
|
| 367 |
-
# Read the Excel file
|
| 368 |
-
df = pd.read_excel(file_path)
|
| 369 |
-
|
| 370 |
# Process the DataFrame
|
| 371 |
console_messages.append("Processing the DataFrame...")
|
| 372 |
result_df, console_messages = nlp_pipeline(df, console_messages)
|
|
|
|
| 342 |
print(f"Optimal clusters: {optimal_clusters}")
|
| 343 |
print(result_df.head())
|
| 344 |
# console_messages.append(f"Optimal clusters: {optimal_n_clusters}")
|
| 345 |
+
|
| 346 |
+
console_messages.append("NLP pipeline completed.")
|
| 347 |
+
return domain_df, console_messages
|
| 348 |
except Exception as e:
|
| 349 |
+
# print(f"Error in extract_problem_domains: {e}")
|
| 350 |
+
console_messages.append(f"Error in extract_problem_domains: {str(e)}")
|
| 351 |
+
# return processed_df, console_messages
|
| 352 |
+
return domain_df, console_messages
|
| 353 |
|
| 354 |
|
| 355 |
# problem_clusters, problem_model = perform_clustering(processed_df['Problem_Description'], n_clusters=10)
|
| 356 |
# location_clusters, location_model = perform_clustering(processed_df['Geographical_Location'], n_clusters=5)
|
| 357 |
|
| 358 |
|
| 359 |
+
|
|
|
|
|
|
|
| 360 |
|
| 361 |
|
| 362 |
def process_excel(file):
|
| 363 |
console_messages = []
|
| 364 |
+
console_messages.append("Processing starts. Reading the uploaded Excel file...")
|
| 365 |
+
# Ensure the file path is correct
|
| 366 |
+
file_path = file.name if hasattr(file, 'name') else file
|
| 367 |
+
# Read the Excel file
|
| 368 |
+
df = pd.read_excel(file_path)
|
| 369 |
+
|
| 370 |
try:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 371 |
# Process the DataFrame
|
| 372 |
console_messages.append("Processing the DataFrame...")
|
| 373 |
result_df, console_messages = nlp_pipeline(df, console_messages)
|