ASLP-lab
/

WSYue-ASR

Model card Files Files and versions

ASLP-lab committed on Aug 30, 2025

Commit

e56d177

·

verified ·

1 Parent(s): 391b67b

Upload 2 files

Files changed (2) hide show

u2pp_conformer_yue/bpe.model +3 -0
u2pp_conformer_yue/train.yaml +95 -0

u2pp_conformer_yue/bpe.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee1b3b4dbe74bbad77f76efd271577db44377ca5a502a8aa44ac4d7dfd58c2d2
+size 253122

u2pp_conformer_yue/train.yaml ADDED Viewed

	@@ -0,0 +1,95 @@

+accum_grad: 4  # presumably gradient-accumulation steps - confirm against the trainer
+ctc: ctc
+ctc_conf:
+  ctc_blank_id: 0  # same id as tokenizer_conf.special_tokens.<blank> (0)
+dataset_conf:
+  batch_conf:
+    batch_type: dynamic
+    max_frames_in_batch: 36000  # presumably the per-batch frame cap for dynamic batching - confirm
+  fbank_conf:
+    dither: 0.1
+    frame_length: 25  # presumably milliseconds - confirm
+    frame_shift: 10  # presumably milliseconds - confirm
+    num_mel_bins: 80  # matches top-level input_dim (80)
+  filter_conf:
+    max_length: 10240  # NOTE(review): units not stated here (frames?) - confirm
+    min_length: 10  # NOTE(review): units not stated here (frames?) - confirm
+    token_max_length: 200
+    token_min_length: 1
+  resample_conf:
+    resample_rate: 16000  # presumably Hz - confirm
+  shuffle: true
+  shuffle_conf:
+    shuffle_size: 1500
+  sort: true
+  sort_conf:
+    sort_size: 500
+  spec_aug: true
+  spec_aug_conf:
+    max_f: 10
+    max_t: 50
+    num_f_mask: 2
+    num_t_mask: 2
+  speed_perturb: true
+decoder: bitransformer
+decoder_conf:
+  attention_heads: 8  # same head count as encoder_conf.attention_heads (8)
+  dropout_rate: 0.1
+  linear_units: 2048  # same width as encoder_conf.linear_units (2048)
+  num_blocks: 3
+  positional_dropout_rate: 0.1
+  r_num_blocks: 3  # presumably the reverse (right-to-left) decoder depth - confirm
+  self_attention_dropout_rate: 0.1
+  src_attention_dropout_rate: 0.1
+dtype: fp32
+encoder: conformer
+encoder_conf:
+  activation_type: swish
+  attention_dropout_rate: 0.1
+  attention_heads: 8
+  cnn_module_kernel: 15
+  dropout_rate: 0.1
+  input_layer: conv2d
+  linear_units: 2048
+  normalize_before: true
+  num_blocks: 12
+  output_size: 512
+  pos_enc_layer_type: rel_pos
+  positional_dropout_rate: 0.1
+  selfattention_layer_type: rel_selfattn
+  use_cnn_module: true
+grad_clip: 5
+input_dim: 80  # matches dataset_conf.fbank_conf.num_mel_bins (80)
+log_interval: 100
+max_epoch: 20
+model: asr_model
+model_conf:
+  ctc_weight: 0.3
+  length_normalized_loss: false
+  lsm_weight: 0.1
+  reverse_weight: 0.3  # presumably weights the reverse decoder (see decoder_conf.r_num_blocks) - confirm
+model_dir: /home/work_nfs17/lhli/workspace/checkpoint/WenetSpeech_Yue_open_source  # NOTE(review): absolute path; likely specific to the training host - override before reuse
+optim: adam
+optim_conf:
+  lr: 0.001
+output_dim: 8629  # equals vocab_size (8629)
+save_states: model_only
+scheduler: warmuplr
+scheduler_conf:
+  warmup_steps: 25000
+tokenizer: bpe
+tokenizer_conf:
+  bpe_path: bpe.model  # relative path; this commit also adds u2pp_conformer_yue/bpe.model
+  is_multilingual: true  # NOTE(review): confirm whether the bpe tokenizer reads this key
+  non_lang_syms_path: null
+  num_languages: 2  # NOTE(review): confirm whether the bpe tokenizer reads this key
+  special_tokens:
+    <blank>: 0  # same id as ctc_conf.ctc_blank_id (0)
+    <eos>: 8628  # shares id 8628 with <sos>; 8628 = vocab_size - 1
+    <sos>: 8628  # shares id 8628 with <eos>
+    <unk>: 1
+  split_with_space: false
+  symbol_table_path: data/dict_bpe/lang_char.txt  # NOTE(review): relative path; file is not among the two files in this commit
+train_engine: torch_ddp
+use_amp: false  # dtype above is fp32
+vocab_size: 8629  # equals output_dim (8629)