Spaces:
Sleeping
Sleeping
Commit
路
2a17f9e
1
Parent(s):
fe0bf0b
Test
Browse files
app.py
CHANGED
|
@@ -564,7 +564,8 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
|
|
| 564 |
perplexity=tsne_params["perplexity"],
|
| 565 |
learning_rate=tsne_params["learning_rate"])
|
| 566 |
|
| 567 |
-
reduced = reducer.fit_transform(df_combined[embedding_cols].values)
|
|
|
|
| 568 |
# Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
|
| 569 |
df_combined['embedding'] = list(reduced)
|
| 570 |
# Si el embedding es 2D, asignamos x e y para visualizaci贸n
|
|
@@ -580,10 +581,10 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
|
|
| 580 |
cont = None
|
| 581 |
silhouette = None
|
| 582 |
|
| 583 |
-
|
| 584 |
-
|
| 585 |
-
|
| 586 |
-
|
| 587 |
|
| 588 |
# silhouette_clustering = DBSCAN(eps=0.1, min_samples=15).fit(reduced)
|
| 589 |
# silhouette_labels = silhouette_clustering.labels_
|
|
@@ -594,16 +595,16 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
|
|
| 594 |
# else:
|
| 595 |
# silhouette = -1
|
| 596 |
|
| 597 |
-
|
| 598 |
-
|
| 599 |
-
|
| 600 |
-
|
| 601 |
-
|
| 602 |
-
|
| 603 |
-
|
| 604 |
-
|
| 605 |
|
| 606 |
-
|
| 607 |
|
| 608 |
dfs_reduced, unique_subsets = split_versions(df_combined, reduced)
|
| 609 |
|
|
|
|
| 564 |
perplexity=tsne_params["perplexity"],
|
| 565 |
learning_rate=tsne_params["learning_rate"])
|
| 566 |
|
| 567 |
+
# reduced = reducer.fit_transform(df_combined[embedding_cols].values)
|
| 568 |
+
reduced = reducer.fit_transform(df_combined[df_combined["version"] == "real"][embedding_cols].values)
|
| 569 |
# Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
|
| 570 |
df_combined['embedding'] = list(reduced)
|
| 571 |
# Si el embedding es 2D, asignamos x e y para visualizaci贸n
|
|
|
|
| 581 |
cont = None
|
| 582 |
silhouette = None
|
| 583 |
|
| 584 |
+
if reduction_method in ("t-SNE","PCA"):
|
| 585 |
+
X = df_combined[embedding_cols].values
|
| 586 |
+
trust = trustworthiness(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
|
| 587 |
+
cont = compute_continuity(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
|
| 588 |
|
| 589 |
# silhouette_clustering = DBSCAN(eps=0.1, min_samples=15).fit(reduced)
|
| 590 |
# silhouette_labels = silhouette_clustering.labels_
|
|
|
|
| 595 |
# else:
|
| 596 |
# silhouette = -1
|
| 597 |
|
| 598 |
+
df_heat = pd.read_csv(f"data/heatmaps_donut.csv")
|
| 599 |
+
feature_options = [col for col in df_heat.columns if col != "name"]
|
| 600 |
+
|
| 601 |
+
silhouette_vals = []
|
| 602 |
+
for feature in feature_options:
|
| 603 |
+
labels = df_heat[feature].values
|
| 604 |
+
silhouette = silhouette_score(reduced, labels)
|
| 605 |
+
silhouette_vals.append(silhouette)
|
| 606 |
|
| 607 |
+
silhouette = np.mean(silhouette_vals)
|
| 608 |
|
| 609 |
dfs_reduced, unique_subsets = split_versions(df_combined, reduced)
|
| 610 |
|