de-Rodrigo commited on
Commit
2a17f9e
1 Parent(s): fe0bf0b
Files changed (1) hide show
  1. app.py +15 -14
app.py CHANGED
@@ -564,7 +564,8 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
564
  perplexity=tsne_params["perplexity"],
565
  learning_rate=tsne_params["learning_rate"])
566
 
567
- reduced = reducer.fit_transform(df_combined[embedding_cols].values)
 
568
  # Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
569
  df_combined['embedding'] = list(reduced)
570
  # Si el embedding es 2D, asignamos x e y para visualizaci贸n
@@ -580,10 +581,10 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
580
  cont = None
581
  silhouette = None
582
 
583
- # if reduction_method in ("t-SNE","PCA"):
584
- # X = df_combined[embedding_cols].values
585
- # trust = trustworthiness(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
586
- # cont = compute_continuity(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
587
 
588
  # silhouette_clustering = DBSCAN(eps=0.1, min_samples=15).fit(reduced)
589
  # silhouette_labels = silhouette_clustering.labels_
@@ -594,16 +595,16 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
594
  # else:
595
  # silhouette = -1
596
 
597
- df_heat = pd.read_csv(f"data/heatmaps_donut.csv")
598
- feature_options = [col for col in df_heat.columns if col != "name"]
599
-
600
- silhouette_vals = []
601
- for feature in feature_options:
602
- labels = df_heat[feature].values
603
- silhouette = silhouette_score(reduced, labels)
604
- silhouette_vals.append(silhouette)
605
 
606
- silhouette = np.mean(silhouette_vals)
607
 
608
  dfs_reduced, unique_subsets = split_versions(df_combined, reduced)
609
 
 
564
  perplexity=tsne_params["perplexity"],
565
  learning_rate=tsne_params["learning_rate"])
566
 
567
+ # reduced = reducer.fit_transform(df_combined[embedding_cols].values)
568
+ reduced = reducer.fit_transform(df_combined[df_combined["version"] == "real"][embedding_cols].values)
569
  # Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
570
  df_combined['embedding'] = list(reduced)
571
  # Si el embedding es 2D, asignamos x e y para visualizaci贸n
 
581
  cont = None
582
  silhouette = None
583
 
584
+ if reduction_method in ("t-SNE","PCA"):
585
+ X = df_combined[embedding_cols].values
586
+ trust = trustworthiness(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
587
+ cont = compute_continuity(X, reduced, n_neighbors=TSNE_NEIGHBOURS)
588
 
589
  # silhouette_clustering = DBSCAN(eps=0.1, min_samples=15).fit(reduced)
590
  # silhouette_labels = silhouette_clustering.labels_
 
595
  # else:
596
  # silhouette = -1
597
 
598
+ df_heat = pd.read_csv(f"data/heatmaps_donut.csv")
599
+ feature_options = [col for col in df_heat.columns if col != "name"]
600
+
601
+ silhouette_vals = []
602
+ for feature in feature_options:
603
+ labels = df_heat[feature].values
604
+ silhouette = silhouette_score(reduced, labels)
605
+ silhouette_vals.append(silhouette)
606
 
607
+ silhouette = np.mean(silhouette_vals)
608
 
609
  dfs_reduced, unique_subsets = split_versions(df_combined, reduced)
610