Iliass Lasri committed on
Commit
7af5906
·
1 Parent(s): c3827e3

add examples config

Browse files
Files changed (1) hide show
  1. config.yaml +74 -0
config.yaml ADDED
@@ -0,0 +1,74 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ training:
2
+ run_name: example_config
3
+ epochs: 150
4
+ learning_rate: 0.0001
5
+ log_interval: 100
6
+ checkpoint_dir: null
7
+ resume_from: null
8
+ n_iterative_pseudolabeling: 3
9
+ lr_scheduler:
10
+ _target_: torch.optim.lr_scheduler.CosineAnnealingLR
11
+ T_max: ${training.epochs}
12
+ eta_min: 1.0e-06
13
+ lr_scheduler_start_epoch: -1
14
+ dataset:
15
+ root: data/LibriSpeech
16
+ train_split: train-clean-100
17
+ test_split: test-clean
18
+ batch_size: 32
19
+ num_workers: 1
20
+ noise_dir: noise_fullband
21
+ max_audio_length: 160000
22
+ augmentations:
23
+ max_augs: 4 # in all our experiments we used 4
24
+ time_stretch: true
25
+ pitch_shift: true
26
+ reverberation: true
27
+ noise: true
28
+ rir_dir: data/rirs
29
+ activate_extra_augs: true
30
+ echo:
31
+ enabled: true
32
+ volume_range:
33
+ - 0.1
34
+ - 0.5
35
+ duration_range:
36
+ - 0.1
37
+ - 0.5
38
+ random_noise:
39
+ enabled: true
40
+ noise_std: 0.001
41
+ pink_noise:
42
+ enabled: true
43
+ noise_std: 0.01
44
+ lowpass_filter:
45
+ enabled: true
46
+ cutoff_freq: 5000
47
+ highpass_filter:
48
+ enabled: true
49
+ cutoff_freq: 500
50
+ bandpass_filter:
51
+ enabled: true
52
+ cutoff_freq_low: 300
53
+ cutoff_freq_high: 8000
54
+ smooth:
55
+ enabled: true
56
+ window_size_range:
57
+ - 2
58
+ - 10
59
+ boost_audio:
60
+ enabled: true
61
+ amount: 20
62
+ duck_audio:
63
+ enabled: true
64
+ amount: 20
65
+ updownresample:
66
+ enabled: true
67
+ intermediate_freq: 32000
68
+ model:
69
+ name: hubert-base-ls960
70
+ layer: 6
71
+ vocab_size: 500
72
+ kind_kmeans: kmeans
73
+ quantizer:
74
+ hidden_dim: 256