Update hyperparams.yaml
Browse files- hyperparams.yaml +9 -9
hyperparams.yaml
CHANGED
|
@@ -3,10 +3,10 @@
|
|
| 3 |
# yamllint disable
|
| 4 |
seed: 1101
|
| 5 |
__set_seed: !apply:speechbrain.utils.seed_everything [1101]
|
| 6 |
-
output_folder:
|
| 7 |
-
output_wer_folder:
|
| 8 |
-
save_folder:
|
| 9 |
-
train_log:
|
| 10 |
|
| 11 |
# Data files
|
| 12 |
data_folder: /mnt/data/commonvoice/uz # e.g., /localscratch/cv-corpus-5.1-2020-06-22/fr
|
|
@@ -17,9 +17,9 @@ test_tsv_file: /mnt/data/commonvoice/uz/test.tsv # Standard CommonVoice .tsv fil
|
|
| 17 |
unlabeled_tsv_file: audio_data_loader/dataloader/youtube_gcp.tsv # Path to the youtube dataset
|
| 18 |
accented_letters: false
|
| 19 |
language: uz # use 'it' for Italian, 'rw' for Kinyarwanda, 'en' for English
|
| 20 |
-
train_csv:
|
| 21 |
-
valid_csv:
|
| 22 |
-
test_csv:
|
| 23 |
unlabeled_csv: audio_data_loader/dataloader/unlabeled_ogg.csv # CREATE IN THE DIRECTORY
|
| 24 |
skip_prep: false # Skip data preparation
|
| 25 |
convert_to_wav: false # Switch this to True to convert all mp3 files to wav.
|
|
@@ -222,7 +222,7 @@ noam_annealing: &id009 !new:speechbrain.nnet.schedulers.NoamScheduler
|
|
| 222 |
n_warmup_steps: 1000
|
| 223 |
|
| 224 |
checkpointer: !new:speechbrain.utils.checkpoints.Checkpointer
|
| 225 |
-
checkpoints_dir:
|
| 226 |
recoverables:
|
| 227 |
model: *id008
|
| 228 |
noam_scheduler: *id009
|
|
@@ -271,7 +271,7 @@ compute_features: !new:speechbrain.lobes.features.Fbank
|
|
| 271 |
n_mels: 80
|
| 272 |
|
| 273 |
train_logger: !new:speechbrain.utils.train_logger.FileTrainLogger
|
| 274 |
-
save_file:
|
| 275 |
|
| 276 |
error_rate_computer: !name:speechbrain.utils.metric_stats.ErrorRateStats
|
| 277 |
acc_computer: !name:speechbrain.utils.Accuracy.AccuracyStats
|
|
|
|
| 3 |
# yamllint disable
|
| 4 |
seed: 1101
|
| 5 |
__set_seed: !apply:speechbrain.utils.seed_everything [1101]
|
| 6 |
+
output_folder: uz_transformer_4000/model_saved
|
| 7 |
+
output_wer_folder: uz_transformer_4000/model_saved/
|
| 8 |
+
save_folder: uz_transformer_4000/model_saved/save
|
| 9 |
+
train_log: uz_transformer_4000/model_saved/train_log.txt
|
| 10 |
|
| 11 |
# Data files
|
| 12 |
data_folder: /mnt/data/commonvoice/uz # e.g., /localscratch/cv-corpus-5.1-2020-06-22/fr
|
|
|
|
| 17 |
unlabeled_tsv_file: audio_data_loader/dataloader/youtube_gcp.tsv # Path to the youtube dataset
|
| 18 |
accented_letters: false
|
| 19 |
language: uz # use 'it' for Italian, 'rw' for Kinyarwanda, 'en' for English
|
| 20 |
+
train_csv: uz_transformer_4000/model_saved/train.csv
|
| 21 |
+
valid_csv: uz_transformer_4000/model_saved/dev.csv
|
| 22 |
+
test_csv: uz_transformer_4000/model_saved/test.csv
|
| 23 |
unlabeled_csv: audio_data_loader/dataloader/unlabeled_ogg.csv # CREATE IN THE DIRECTORY
|
| 24 |
skip_prep: false # Skip data preparation
|
| 25 |
convert_to_wav: false # Switch this to True to convert all mp3 files to wav.
|
|
|
|
| 222 |
n_warmup_steps: 1000
|
| 223 |
|
| 224 |
checkpointer: !new:speechbrain.utils.checkpoints.Checkpointer
|
| 225 |
+
checkpoints_dir: uz_transformer_4000/model_saved/save
|
| 226 |
recoverables:
|
| 227 |
model: *id008
|
| 228 |
noam_scheduler: *id009
|
|
|
|
| 271 |
n_mels: 80
|
| 272 |
|
| 273 |
train_logger: !new:speechbrain.utils.train_logger.FileTrainLogger
|
| 274 |
+
save_file: uz_transformer_4000/model_saved/train_log.txt
|
| 275 |
|
| 276 |
error_rate_computer: !name:speechbrain.utils.metric_stats.ErrorRateStats
|
| 277 |
acc_computer: !name:speechbrain.utils.Accuracy.AccuracyStats
|