krislette commited on
Commit
11a030b
·
1 Parent(s): 568ba48

Auto-deploy from GitHub: 6396671754454c2d7731d18b21582eb005eb0004

Browse files
Files changed (1) hide show
  1. src/utils/dataset.py +5 -5
src/utils/dataset.py CHANGED
@@ -115,12 +115,12 @@ def scale_pca(data: dict):
115
  X_test_lyrics = ipca.transform(X_test_lyrics)
116
  X_val_lyrics = ipca.transform(X_val_lyrics)
117
 
118
- # Apply scaler to the PCA output
119
- pca_lyric_scaler = StandardScaler().fit(X_train_lyrics)
120
 
121
- X_train_lyrics = pca_lyric_scaler.transform(X_train_lyrics)
122
- X_test_lyrics = pca_lyric_scaler.transform(X_test_lyrics)
123
- X_val_lyrics = pca_lyric_scaler.transform(X_val_lyrics)
124
 
125
  # Concatenate them back to their original form, but scaled
126
  X_train = np.concatenate([X_train_audio, X_train_lyrics], axis=1)
 
115
  X_test_lyrics = ipca.transform(X_test_lyrics)
116
  X_val_lyrics = ipca.transform(X_val_lyrics)
117
 
118
+ # NOTE: Scaling after PCA produces underperforming models compared to non-scaling. One can toggle it on for experimentation/testing purposes.
119
+ #pca_lyric_scaler = StandardScaler().fit(X_train_lyrics)
120
 
121
+ #X_train_lyrics = pca_lyric_scaler.transform(X_train_lyrics)
122
+ #X_test_lyrics = pca_lyric_scaler.transform(X_test_lyrics)
123
+ #X_val_lyrics = pca_lyric_scaler.transform(X_val_lyrics)
124
 
125
  # Concatenate them back to their original form, but scaled
126
  X_train = np.concatenate([X_train_audio, X_train_lyrics], axis=1)