Update hyperparams.yaml
Browse files
- hyperparams.yaml +12 -7
hyperparams.yaml
CHANGED
|
@@ -22,10 +22,10 @@ n_mels: 80
|
|
| 22 |
out_n_neurons: 50
|
| 23 |
|
| 24 |
# embedding_model: !new:custom_models.Conv2dEncoder_v2
|
| 25 |
-
embedding_model:
|
| 26 |
dim: 256
|
| 27 |
|
| 28 |
-
classifier:
|
| 29 |
input_size: 256
|
| 30 |
out_neurons: 50
|
| 31 |
lin_blocks: 1
|
|
@@ -38,25 +38,30 @@ n_fft: 1024
|
|
| 38 |
spec_mag_power: 0.5
|
| 39 |
hop_length: 11.6099
|
| 40 |
win_length: 23.2199
|
| 41 |
-
compute_stft:
|
| 42 |
n_fft: 1024
|
| 43 |
hop_length: 11.6099
|
| 44 |
win_length: 23.2199
|
| 45 |
sample_rate: 16000
|
| 46 |
|
| 47 |
-
compute_fbank:
|
| 48 |
n_mels: 80
|
| 49 |
n_fft: 1024
|
| 50 |
sample_rate: 16000
|
| 51 |
|
| 52 |
-
compute_istft:
|
| 53 |
sample_rate: 16000
|
| 54 |
hop_length: 11.6099
|
| 55 |
win_length: 23.2199
|
| 56 |
|
| 57 |
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
| 58 |
-
psi_model:
|
| 59 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 60 |
|
| 61 |
modules:
|
| 62 |
compute_stft: !ref <compute_stft>
|
|
|
|
| 22 |
out_n_neurons: 50
|
| 23 |
|
| 24 |
# embedding_model: !new:custom_models.Conv2dEncoder_v2
|
| 25 |
+
embedding_model: !new:speechbrain.lobes.models.PIQ.Conv2dEncoder_v2
|
| 26 |
dim: 256
|
| 27 |
|
| 28 |
+
classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier
|
| 29 |
input_size: 256
|
| 30 |
out_neurons: 50
|
| 31 |
lin_blocks: 1
|
|
|
|
| 38 |
spec_mag_power: 0.5
|
| 39 |
hop_length: 11.6099
|
| 40 |
win_length: 23.2199
|
| 41 |
+
compute_stft: !new:speechbrain.processing.features.STFT
|
| 42 |
n_fft: 1024
|
| 43 |
hop_length: 11.6099
|
| 44 |
win_length: 23.2199
|
| 45 |
sample_rate: 16000
|
| 46 |
|
| 47 |
+
compute_fbank: !new:speechbrain.processing.features.Filterbank
|
| 48 |
n_mels: 80
|
| 49 |
n_fft: 1024
|
| 50 |
sample_rate: 16000
|
| 51 |
|
| 52 |
+
compute_istft: !new:speechbrain.processing.features.ISTFT
|
| 53 |
sample_rate: 16000
|
| 54 |
hop_length: 11.6099
|
| 55 |
win_length: 23.2199
|
| 56 |
|
| 57 |
label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
|
| 58 |
+
psi_model: !new:speechbrain.lobes.models.PIQ.VectorQuantizedPSI_Audio
|
| 59 |
+
dim: 256
|
| 60 |
+
K: 1024
|
| 61 |
+
shared_keys: 0
|
| 62 |
+
activate_class_partitioning: true
|
| 63 |
+
use_adapter: true
|
| 64 |
+
adapter_reduce_dim: true
|
| 65 |
|
| 66 |
modules:
|
| 67 |
compute_stft: !ref <compute_stft>
|