qingzhengwang committed on
Commit
03f2e41
·
1 Parent(s): d70766b

Fix readme

Browse files
Files changed (1) hide show
  1. README.md +21 -25
README.md CHANGED
@@ -113,14 +113,14 @@ The training utilized a combined dataset, merging five domain-specific corpora,
113
  <details><summary>expand</summary>
114
 
115
  ```
116
- config: /work/nvme/bbjs/qwang20/espnet/egs2/lid_delta/lid1/conf/mms_1b_all_no_filter_balanced_dataset/mms_ecapa_upcon_32_44_it0.4_sharedCondProj_butUpdate_50k_lr1e-5_datasetup0.3_backup_33epoch.yaml
117
  print_config: false
118
  log_level: INFO
119
  drop_last_iter: false
120
  dry_run: false
121
  iterator_type: category
122
  valid_iterator_type: category
123
- output_dir: exp_all_no_filter_raw/spk_mms_ecapa_upcon_32_44_it0.4_sharedCondProj_butUpdate_50k_lr1e-5_datasetup0.3_backup_33epoch_raw
124
  ngpu: 1
125
  seed: 3702
126
  num_workers: 8
@@ -138,6 +138,8 @@ unused_parameters: true
138
  sharded_ddp: false
139
  use_deepspeed: false
140
  deepspeed_config: null
 
 
141
  cudnn_enabled: true
142
  cudnn_benchmark: true
143
  cudnn_deterministic: false
@@ -171,10 +173,10 @@ log_interval: 100
171
  use_matplotlib: true
172
  use_tensorboard: true
173
  create_graph_in_tensorboard: false
174
- use_wandb: true
175
- wandb_project: lid
176
  wandb_id: null
177
- wandb_entity: qingzhew-carnegie-mellon-university
178
  wandb_name: null
179
  wandb_model_log_interval: -1
180
  detect_anomaly: false
@@ -192,16 +194,18 @@ valid_batch_size: null
192
  batch_bins: 1440000
193
  valid_batch_bins: null
194
  category_sample_size: 10
195
- train_shape_file:
196
- - exp_all_no_filter_raw/spk_stats_16k/train/speech_shape
197
- valid_shape_file:
198
- - exp_all_no_filter_raw/spk_stats_16k/valid/speech_shape
199
- batch_type: catpow_balance_dataset
200
  upsampling_factor: 0.5
201
- language_upsampling_factor: 0.5
202
  dataset_upsampling_factor: 0.3
203
  dataset_scaling_factor: 1.2
204
  max_batch_size: 6
 
 
 
 
 
 
 
205
  valid_batch_type: null
206
  fold_length:
207
  - 120000
@@ -220,14 +224,14 @@ train_data_path_and_name_and_type:
220
  - - dump/raw/train_all_no_filter_lang/wav.scp
221
  - speech
222
  - sound
223
- - - dump/raw/train_all_no_filter_lang/utt2spk
224
  - lid_labels
225
  - text
226
  valid_data_path_and_name_and_type:
227
  - - dump/raw/dev_ml_superb2_lang/wav.scp
228
  - speech
229
  - sound
230
- - - dump/raw/dev_ml_superb2_lang/utt2spk
231
  - lid_labels
232
  - text
233
  multi_task_dataset: false
@@ -256,8 +260,8 @@ init: null
256
  use_preprocessor: true
257
  input_size: null
258
  target_duration: 3.0
259
- spk2utt: dump/raw/train_all_no_filter_lang/spk2utt
260
- spk_num: 157
261
  sample_rate: 16000
262
  num_eval: 10
263
  rir_scp: ''
@@ -268,19 +272,11 @@ model_conf:
268
  - 36
269
  - 40
270
  - 44
271
- lid_conditioning_layers: []
272
- frozen_ecapa: false
273
  apply_intermediate_lang2vec_loss: true
274
- apply_intermediate_lid_class_loss: false
275
  apply_intermediate_lang2vec_condition: true
276
- apply_intermediate_lid_class_condition: false
277
  inter_lang2vec_loss_weight: 0.4
278
- inter_lid_class_loss_weight: 0.0
279
  cutoff_gradient_from_backbone: false
280
- cutoff_gradient_before_condtrans: true
281
- independent_module: true
282
- use_gate: false
283
- gate_type: null
284
  shared_conditioning_proj: true
285
  frontend: s3prl_condition
286
  frontend_conf:
@@ -350,7 +346,7 @@ loss_conf:
350
  lang2vec_weight: 0.2
351
  required:
352
  - output_dir
353
- version: '202412'
354
  distributed: false
355
  ```
356
 
 
113
  <details><summary>expand</summary>
114
 
115
  ```
116
+ config: conf/combined/mms_ecapa_upcon_32_44_it0.4_shared_trainable_dev.yaml
117
  print_config: false
118
  log_level: INFO
119
  drop_last_iter: false
120
  dry_run: false
121
  iterator_type: category
122
  valid_iterator_type: category
123
+ output_dir: exp_combined/lid_mms_ecapa_upcon_32_44_it0.4_shared_trainable_dev_raw
124
  ngpu: 1
125
  seed: 3702
126
  num_workers: 8
 
138
  sharded_ddp: false
139
  use_deepspeed: false
140
  deepspeed_config: null
141
+ gradient_as_bucket_view: true
142
+ ddp_comm_hook: null
143
  cudnn_enabled: true
144
  cudnn_benchmark: true
145
  cudnn_deterministic: false
 
173
  use_matplotlib: true
174
  use_tensorboard: true
175
  create_graph_in_tensorboard: false
176
+ use_wandb: false
177
+ wandb_project: null
178
  wandb_id: null
179
+ wandb_entity: null
180
  wandb_name: null
181
  wandb_model_log_interval: -1
182
  detect_anomaly: false
 
194
  batch_bins: 1440000
195
  valid_batch_bins: null
196
  category_sample_size: 10
 
 
 
 
 
197
  upsampling_factor: 0.5
198
+ category_upsampling_factor: 0.5
199
  dataset_upsampling_factor: 0.3
200
  dataset_scaling_factor: 1.2
201
  max_batch_size: 6
202
+ min_batch_size: 1
203
+ train_shape_file:
204
+ - exp_combined/lid_stats_16k/train/speech_shape
205
+ valid_shape_file:
206
+ - exp_combined/lid_stats_16k/valid/speech_shape
207
+ batch_type: catpow_balance_dataset
208
+ language_upsampling_factor: 0.5
209
  valid_batch_type: null
210
  fold_length:
211
  - 120000
 
224
  - - dump/raw/train_all_no_filter_lang/wav.scp
225
  - speech
226
  - sound
227
+ - - dump/raw/train_all_no_filter_lang/utt2lang
228
  - lid_labels
229
  - text
230
  valid_data_path_and_name_and_type:
231
  - - dump/raw/dev_ml_superb2_lang/wav.scp
232
  - speech
233
  - sound
234
+ - - dump/raw/dev_ml_superb2_lang/utt2lang
235
  - lid_labels
236
  - text
237
  multi_task_dataset: false
 
260
  use_preprocessor: true
261
  input_size: null
262
  target_duration: 3.0
263
+ lang2utt: dump/raw/train_all_no_filter_lang/lang2utt
264
+ lang_num: 157
265
  sample_rate: 16000
266
  num_eval: 10
267
  rir_scp: ''
 
272
  - 36
273
  - 40
274
  - 44
 
 
275
  apply_intermediate_lang2vec_loss: true
 
276
  apply_intermediate_lang2vec_condition: true
 
277
  inter_lang2vec_loss_weight: 0.4
 
278
  cutoff_gradient_from_backbone: false
279
+ cutoff_gradient_before_condproj: true
 
 
 
280
  shared_conditioning_proj: true
281
  frontend: s3prl_condition
282
  frontend_conf:
 
346
  lang2vec_weight: 0.2
347
  required:
348
  - output_dir
349
+ version: '202506'
350
  distributed: false
351
  ```
352