Automatic Speech Recognition
multilingual
DataoceanAI committed on
Commit
bf48921
·
verified ·
1 Parent(s): d0b2cc7

upload train config and vocabulary

Browse files
Files changed (2) hide show
  1. train.yaml +114 -0
  2. units.txt +0 -0
train.yaml ADDED
@@ -0,0 +1,114 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accum_grad: 8
2
+ cmvn: global_mvn
3
+ cmvn_conf:
4
+ cmvn_file: /data/models/dolphin-small/feats_stats.npz
5
+ ctc: ctc
6
+ ctc_conf:
7
+ ctc_blank_id: 0
8
+ dataset: asr
9
+ dataset_conf:
10
+ batch_conf:
11
+ batch_size: 16
12
+ batch_type: static
13
+ ctc_label: true
14
+ cycle: 100
15
+ fbank_conf:
16
+ dither: 0.1
17
+ frame_length: 25
18
+ frame_shift: 10
19
+ num_mel_bins: 80
20
+ frontend_conf:
21
+ n_fft: 512
22
+ win_length: 400
23
+ hop_length: 160
24
+ fs: 16000
25
+ filter_conf:
26
+ max_length: 3000
27
+ min_length: 0
28
+ token_max_length: 200
29
+ token_min_length: 1
30
+ no_time_idx: 3
31
+ remove_punctuation: true
32
+ remove_timestamp: true
33
+ resample_conf:
34
+ resample_rate: 16000
35
+ shuffle: true
36
+ shuffle_conf:
37
+ shuffle_size: 5120
38
+ sort: true
39
+ sort_conf:
40
+ sort_size: 2048
41
+ spec_aug: true
42
+ spec_aug_conf:
43
+ max_f: 10
44
+ max_t: 50
45
+ num_f_mask: 2
46
+ num_t_mask: 2
47
+ speed_perturb: true
48
+ time_apply_prob: 0.0
49
+ decoder: transformer
50
+ decoder_conf:
51
+ attention_heads: 8
52
+ dropout_rate: 0.1
53
+ linear_units: 2048
54
+ num_blocks: 6
55
+ positional_dropout_rate: 0.1
56
+ self_attention_dropout_rate: 0.1
57
+ src_attention_dropout_rate: 0.1
58
+ use_sdpa: false
59
+ dtype: fp32
60
+ encoder: e_branchformer
61
+ encoder_conf:
62
+ activation_type: swish
63
+ attention_dropout_rate: 0.1
64
+ attention_heads: 8
65
+ causal: false
66
+ cgmlp_conv_kernel: 31
67
+ cgmlp_linear_units: 2048
68
+ dropout_rate: 0.1
69
+ gate_activation: identity
70
+ input_layer: conv2d
71
+ linear_units: 2048
72
+ merge_conv_kernel: 31
73
+ num_blocks: 6
74
+ output_size: 512
75
+ pos_enc_layer_type: rel_pos_v1
76
+ positional_dropout_rate: 0.1
77
+ selfattention_layer_type: rel_selfattn
78
+ use_linear_after_conv: false
79
+ use_sdpa: false
80
+ grad_clip: 5
81
+ input_dim: 80
82
+ log_interval: 200
83
+ max_epoch: 100
84
+ model: asr_model
85
+ model_conf:
86
+ ctc_weight: 0.3
87
+ length_normalized_loss: false
88
+ lsm_weight: 0.1
89
+ model_dir: exp/dolphin_ebf_small_nonstreaming_v4.3
90
+ optim: adam
91
+ optim_conf:
92
+ lr: 0.0005
93
+ output_dim: 40002
94
+ save_interval: 1000
95
+ save_states: model_only
96
+ scheduler: warmuplr
97
+ scheduler_conf:
98
+ warmup_steps: 2048
99
+ stats_dialect: true
100
+ tokenizer: bpe
101
+ tokenizer_conf:
102
+ bpe_path: /data/models/dolphin-small/bpe.model
103
+ symbol_table_path: /data/models/dolphin-small/units.txt
104
+ special_tokens:
105
+ <asr>: 6
106
+ <blank>: 0
107
+ <eos>: 40000
108
+ <sos>: 39999
109
+ <unk>: 1
110
+ train_engine: torch_ddp
111
+ use_amp: false
112
+ vocab_size: 40002
113
+ layer_norm_eps: 1e-12
114
+ support_timestamp: true
units.txt ADDED
The diff for this file is too large to render. See raw diff