de-Rodrigo commited on
Commit
d967697
·
1 Parent(s): 79df3f5

Rescale PCA output

Browse files
Files changed (1) hide show
  1. app.py +6 -0
app.py CHANGED
@@ -8,6 +8,7 @@ from bokeh.palettes import Reds9, Blues9, Oranges9, Purples9, Greys9, BuGn9, Gre
8
  from sklearn.decomposition import PCA
9
  from sklearn.manifold import TSNE, trustworthiness
10
  from sklearn.metrics import pairwise_distances
 
11
  import io
12
  import ot
13
  from sklearn.linear_model import LinearRegression
@@ -456,6 +457,8 @@ def compute_global_regression(df_combined, embedding_cols, tsne_params, df_f1, r
456
  learning_rate=tsne_params["learning_rate"])
457
 
458
  reduced = reducer.fit_transform(df_combined[embedding_cols].values)
 
 
459
  # Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
460
  df_combined['embedding'] = list(reduced)
461
  # Si el embedding es 2D, asignamos x e y para visualización
@@ -790,6 +793,9 @@ def run_model(model_name):
790
  df_real_only = embeddings["real"].copy()
791
  pca_real = PCA(n_components=N_COMPONENTS)
792
  reduced_real = pca_real.fit_transform(df_real_only[embedding_cols].values)
 
 
 
793
 
794
  # Agregar columnas PC1, PC2, … a df_real_only
795
  for i in range(reduced_real.shape[1]):
 
8
  from sklearn.decomposition import PCA
9
  from sklearn.manifold import TSNE, trustworthiness
10
  from sklearn.metrics import pairwise_distances
11
+ from sklearn.preprocessing import MinMaxScaler
12
  import io
13
  import ot
14
  from sklearn.linear_model import LinearRegression
 
457
  learning_rate=tsne_params["learning_rate"])
458
 
459
  reduced = reducer.fit_transform(df_combined[embedding_cols].values)
460
+ scaler = MinMaxScaler(feature_range=(-1, 1))
461
+ reduced = scaler.fit_transform(reduced)
462
  # Guardamos el embedding completo (por ejemplo, 4 dimensiones en PCA)
463
  df_combined['embedding'] = list(reduced)
464
  # Si el embedding es 2D, asignamos x e y para visualización
 
793
  df_real_only = embeddings["real"].copy()
794
  pca_real = PCA(n_components=N_COMPONENTS)
795
  reduced_real = pca_real.fit_transform(df_real_only[embedding_cols].values)
796
+
797
+ scaler_real = MinMaxScaler(feature_range=(-1, 1))
798
+ reduced_real = scaler_real.fit_transform(reduced_real)
799
 
800
  # Agregar columnas PC1, PC2, … a df_real_only
801
  for i in range(reduced_real.shape[1]):