Spaces:
Running
Running
Auto-deploy from GitHub: 6396671754454c2d7731d18b21582eb005eb0004
Browse files- src/utils/dataset.py +5 -5
src/utils/dataset.py
CHANGED
|
@@ -115,12 +115,12 @@ def scale_pca(data: dict):
|
|
| 115 |
X_test_lyrics = ipca.transform(X_test_lyrics)
|
| 116 |
X_val_lyrics = ipca.transform(X_val_lyrics)
|
| 117 |
|
| 118 |
-
#
|
| 119 |
-
pca_lyric_scaler = StandardScaler().fit(X_train_lyrics)
|
| 120 |
|
| 121 |
-
X_train_lyrics = pca_lyric_scaler.transform(X_train_lyrics)
|
| 122 |
-
X_test_lyrics = pca_lyric_scaler.transform(X_test_lyrics)
|
| 123 |
-
X_val_lyrics = pca_lyric_scaler.transform(X_val_lyrics)
|
| 124 |
|
| 125 |
# Concatenate them back to their original form, but scaled
|
| 126 |
X_train = np.concatenate([X_train_audio, X_train_lyrics], axis=1)
|
|
|
|
| 115 |
X_test_lyrics = ipca.transform(X_test_lyrics)
|
| 116 |
X_val_lyrics = ipca.transform(X_val_lyrics)
|
| 117 |
|
| 118 |
+
# NOTE: Scaling after PCA produces underperforming models compared to non-scaling. One can toggle it on for experimentation/testing purposes.
|
| 119 |
+
#pca_lyric_scaler = StandardScaler().fit(X_train_lyrics)
|
| 120 |
|
| 121 |
+
#X_train_lyrics = pca_lyric_scaler.transform(X_train_lyrics)
|
| 122 |
+
#X_test_lyrics = pca_lyric_scaler.transform(X_test_lyrics)
|
| 123 |
+
#X_val_lyrics = pca_lyric_scaler.transform(X_val_lyrics)
|
| 124 |
|
| 125 |
# Concatenate them back to their original form, but scaled
|
| 126 |
X_train = np.concatenate([X_train_audio, X_train_lyrics], axis=1)
|