NickolayFM committed on
Commit
08276da
·
verified ·
1 Parent(s): 50921f6

Upload logs

Browse files
Files changed (2) hide show
  1. config.yaml +101 -0
  2. info.log +0 -0
config.yaml ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ _target_: src.model.ConformerModel
3
+ input_dim: 128
4
+ writer:
5
+ _target_: src.logger.CometMLWriter
6
+ project_name: pytorch_template_asr_example
7
+ workspace: null
8
+ run_name: conformer_30m
9
+ mode: online
10
+ loss_names:
11
+ - loss
12
+ log_checkpoints: false
13
+ id_length: 32
14
+ run_id: m2guzao93o9ytjxogwt78mftkyiqalsf
15
+ metrics:
16
+ train: []
17
+ inference:
18
+ - _target_: src.metrics.ArgmaxCERMetric
19
+ name: CER_(Argmax)
20
+ - _target_: src.metrics.ArgmaxWERMetric
21
+ name: WER_(Argmax)
22
+ - _target_: src.metrics.WER
23
+ name: WER
24
+ - _target_: src.metrics.CER
25
+ name: CER
26
+ datasets:
27
+ train:
28
+ _target_: src.datasets.LibrispeechDataset
29
+ part: train-other-500
30
+ instance_transforms: ${transforms.instance_transforms.train}
31
+ val:
32
+ _target_: src.datasets.LibrispeechDataset
33
+ part: test-clean
34
+ instance_transforms: ${transforms.instance_transforms.inference}
35
+ test:
36
+ _target_: src.datasets.LibrispeechDataset
37
+ part: test-other
38
+ instance_transforms: ${transforms.instance_transforms.inference}
39
+ dataloader:
40
+ _target_: torch.utils.data.DataLoader
41
+ batch_size: 30
42
+ num_workers: 2
43
+ pin_memory: true
44
+ transforms:
45
+ instance_transforms:
46
+ train:
47
+ get_spectrogram:
48
+ _target_: torchaudio.transforms.MelSpectrogram
49
+ sample_rate: 16000
50
+ audio:
51
+ _target_: torchvision.transforms.v2.Compose
52
+ transforms:
53
+ - _target_: src.transforms.wav_augs.Gain
54
+ sample_rate: 16000
55
+ min_gain_in_db: -6
56
+ max_gain_in_db: 6
57
+ p: 0.2
58
+ - _target_: src.transforms.wav_augs.Shift
59
+ p: 0.2
60
+ - _target_: src.transforms.wav_augs.PitchShift
61
+ min_semitones: -2
62
+ max_semitones: 2
63
+ p: 0.2
64
+ - _target_: src.transforms.wav_augs.Noise
65
+ p: 0.3
66
+ inference:
67
+ get_spectrogram:
68
+ _target_: torchaudio.transforms.MelSpectrogram
69
+ sample_rate: 16000
70
+ batch_transforms:
71
+ train: null
72
+ inference: null
73
+ optimizer:
74
+ _target_: torch.optim.AdamW
75
+ lr: 5.0e-05
76
+ lr_scheduler:
77
+ _target_: torch.optim.lr_scheduler.OneCycleLR
78
+ max_lr: 0.0001
79
+ pct_start: 0.1
80
+ steps_per_epoch: ${trainer.epoch_len}
81
+ epochs: ${trainer.n_epochs}
82
+ anneal_strategy: cos
83
+ loss_function:
84
+ _target_: src.loss.CTCLossWrapper
85
+ text_encoder:
86
+ _target_: src.text_encoder.CTCTextEncoder
87
+ trainer:
88
+ log_step: 200
89
+ n_epochs: 150
90
+ epoch_len: 1300
91
+ device_tensors:
92
+ - spectrogram
93
+ - text_encoded
94
+ resume_from: checkpoint-epoch62.pth
95
+ device: auto
96
+ override: false
97
+ monitor: min val_WER_(Argmax)
98
+ save_period: 5
99
+ early_stop: ${trainer.n_epochs}
100
+ save_dir: saved
101
+ seed: 1
info.log ADDED
The diff for this file is too large to render. See raw diff