qingzhengwang committed on
Commit
01fb9cd
·
1 Parent(s): 8d8a4e7

Update config

Browse files
exp_combined/lid_mms_ecapa_upcon_32_44_it0.4_shared_trainable_raw/config.yaml CHANGED
@@ -1,11 +1,11 @@
1
- config: /work/nvme/bbjs/qwang20/espnet/egs2/lid_delta/lid1/conf/mms_1b_all_no_filter_balanced_dataset/mms_ecapa_upcon_32_44_it0.4_sharedCondProj_butUpdate_50k_lr1e-5_datasetup0.3_backup_33epoch.yaml
2
  print_config: false
3
  log_level: INFO
4
  drop_last_iter: false
5
  dry_run: false
6
  iterator_type: category
7
  valid_iterator_type: category
8
- output_dir: exp_all_no_filter_raw/spk_mms_ecapa_upcon_32_44_it0.4_sharedCondProj_butUpdate_50k_lr1e-5_datasetup0.3_backup_33epoch_raw
9
  ngpu: 1
10
  seed: 3702
11
  num_workers: 8
@@ -23,6 +23,8 @@ unused_parameters: true
23
  sharded_ddp: false
24
  use_deepspeed: false
25
  deepspeed_config: null
 
 
26
  cudnn_enabled: true
27
  cudnn_benchmark: true
28
  cudnn_deterministic: false
@@ -56,10 +58,10 @@ log_interval: 100
56
  use_matplotlib: true
57
  use_tensorboard: true
58
  create_graph_in_tensorboard: false
59
- use_wandb: true
60
- wandb_project: lid
61
  wandb_id: null
62
- wandb_entity: qingzhew-carnegie-mellon-university
63
  wandb_name: null
64
  wandb_model_log_interval: -1
65
  detect_anomaly: false
@@ -77,16 +79,18 @@ valid_batch_size: null
77
  batch_bins: 1440000
78
  valid_batch_bins: null
79
  category_sample_size: 10
80
- train_shape_file:
81
- - exp_all_no_filter_raw/spk_stats_16k/train/speech_shape
82
- valid_shape_file:
83
- - exp_all_no_filter_raw/spk_stats_16k/valid/speech_shape
84
- batch_type: catpow_balance_dataset
85
  upsampling_factor: 0.5
86
- language_upsampling_factor: 0.5
87
  dataset_upsampling_factor: 0.3
88
  dataset_scaling_factor: 1.2
89
  max_batch_size: 6
 
 
 
 
 
 
 
90
  valid_batch_type: null
91
  fold_length:
92
  - 120000
@@ -105,14 +109,14 @@ train_data_path_and_name_and_type:
105
  - - dump/raw/train_all_no_filter_lang/wav.scp
106
  - speech
107
  - sound
108
- - - dump/raw/train_all_no_filter_lang/utt2spk
109
  - lid_labels
110
  - text
111
  valid_data_path_and_name_and_type:
112
  - - dump/raw/dev_ml_superb2_lang/wav.scp
113
  - speech
114
  - sound
115
- - - dump/raw/dev_ml_superb2_lang/utt2spk
116
  - lid_labels
117
  - text
118
  multi_task_dataset: false
@@ -141,8 +145,8 @@ init: null
141
  use_preprocessor: true
142
  input_size: null
143
  target_duration: 3.0
144
- spk2utt: dump/raw/train_all_no_filter_lang/spk2utt
145
- spk_num: 157
146
  sample_rate: 16000
147
  num_eval: 10
148
  rir_scp: ''
@@ -153,19 +157,11 @@ model_conf:
153
  - 36
154
  - 40
155
  - 44
156
- lid_conditioning_layers: []
157
- frozen_ecapa: false
158
  apply_intermediate_lang2vec_loss: true
159
- apply_intermediate_lid_class_loss: false
160
  apply_intermediate_lang2vec_condition: true
161
- apply_intermediate_lid_class_condition: false
162
  inter_lang2vec_loss_weight: 0.4
163
- inter_lid_class_loss_weight: 0.0
164
  cutoff_gradient_from_backbone: false
165
- cutoff_gradient_before_condtrans: true
166
- independent_module: true
167
- use_gate: false
168
- gate_type: null
169
  shared_conditioning_proj: true
170
  frontend: s3prl_condition
171
  frontend_conf:
@@ -235,5 +231,5 @@ loss_conf:
235
  lang2vec_weight: 0.2
236
  required:
237
  - output_dir
238
- version: '202412'
239
  distributed: false
 
1
+ config: conf/combined/mms_ecapa_upcon_32_44_it0.4_shared_trainable_dev.yaml
2
  print_config: false
3
  log_level: INFO
4
  drop_last_iter: false
5
  dry_run: false
6
  iterator_type: category
7
  valid_iterator_type: category
8
+ output_dir: exp_combined/lid_mms_ecapa_upcon_32_44_it0.4_shared_trainable_dev_raw
9
  ngpu: 1
10
  seed: 3702
11
  num_workers: 8
 
23
  sharded_ddp: false
24
  use_deepspeed: false
25
  deepspeed_config: null
26
+ gradient_as_bucket_view: true
27
+ ddp_comm_hook: null
28
  cudnn_enabled: true
29
  cudnn_benchmark: true
30
  cudnn_deterministic: false
 
58
  use_matplotlib: true
59
  use_tensorboard: true
60
  create_graph_in_tensorboard: false
61
+ use_wandb: false
62
+ wandb_project: null
63
  wandb_id: null
64
+ wandb_entity: null
65
  wandb_name: null
66
  wandb_model_log_interval: -1
67
  detect_anomaly: false
 
79
  batch_bins: 1440000
80
  valid_batch_bins: null
81
  category_sample_size: 10
 
 
 
 
 
82
  upsampling_factor: 0.5
83
+ category_upsampling_factor: 0.5
84
  dataset_upsampling_factor: 0.3
85
  dataset_scaling_factor: 1.2
86
  max_batch_size: 6
87
+ min_batch_size: 1
88
+ train_shape_file:
89
+ - exp_combined/lid_stats_16k/train/speech_shape
90
+ valid_shape_file:
91
+ - exp_combined/lid_stats_16k/valid/speech_shape
92
+ batch_type: catpow_balance_dataset
93
+ language_upsampling_factor: 0.5
94
  valid_batch_type: null
95
  fold_length:
96
  - 120000
 
109
  - - dump/raw/train_all_no_filter_lang/wav.scp
110
  - speech
111
  - sound
112
+ - - dump/raw/train_all_no_filter_lang/utt2lang
113
  - lid_labels
114
  - text
115
  valid_data_path_and_name_and_type:
116
  - - dump/raw/dev_ml_superb2_lang/wav.scp
117
  - speech
118
  - sound
119
+ - - dump/raw/dev_ml_superb2_lang/utt2lang
120
  - lid_labels
121
  - text
122
  multi_task_dataset: false
 
145
  use_preprocessor: true
146
  input_size: null
147
  target_duration: 3.0
148
+ lang2utt: dump/raw/train_all_no_filter_lang/lang2utt
149
+ lang_num: 157
150
  sample_rate: 16000
151
  num_eval: 10
152
  rir_scp: ''
 
157
  - 36
158
  - 40
159
  - 44
 
 
160
  apply_intermediate_lang2vec_loss: true
 
161
  apply_intermediate_lang2vec_condition: true
 
162
  inter_lang2vec_loss_weight: 0.4
 
163
  cutoff_gradient_from_backbone: false
164
+ cutoff_gradient_before_condproj: true
 
 
 
165
  shared_conditioning_proj: true
166
  frontend: s3prl_condition
167
  frontend_conf:
 
231
  lang2vec_weight: 0.2
232
  required:
233
  - output_dir
234
+ version: '202506'
235
  distributed: false