ZiweiLi committed on
Commit
f945760
·
1 Parent(s): f366ad1

add model and config

Browse files
Files changed (6) hide show
  1. .gitattributes +2 -0
  2. best-3.pt +3 -0
  3. config.json +42 -0
  4. hyper-p.json +70 -0
  5. lexicon_mul10.txt +3 -0
  6. tokenizer_mul10.tknz +3 -0
.gitattributes CHANGED
@@ -33,3 +33,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.txt filter=lfs diff=lfs merge=lfs -text
37
+ *.tknz filter=lfs diff=lfs merge=lfs -text
best-3.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c56031e62889ab9b759b269f3ddc3f5796c3511df0b7bc55e7d251c82bb67408
3
+ size 875628375
config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "specaug": {
3
+ "freq_mask_width_range": 0.35,
4
+ "num_freq_mask": 2,
5
+ "num_time_mask": 10,
6
+ "time_mask_width_range": 0.05
7
+ },
8
+ "encoder": {
9
+ "type": "ConformerNet",
10
+ "kwargs": {
11
+ "num_cells": 22,
12
+ "idim": 80,
13
+ "hdim": 640,
14
+ "conv": "vgg2l",
15
+ "num_heads": 4,
16
+ "d_head": 160,
17
+ "kernel_size": 15,
18
+ "num_classes": 75
19
+ }
20
+ },
21
+ "scheduler": {
22
+ "type": "SchedulerNoamEarlyStop",
23
+ "kwargs": {
24
+ "warmup_step": 20000,
25
+ "min_step": 30000,
26
+ "dim_model": 640,
27
+ "peak_factor": 1.0,
28
+ "n_tol": 50
29
+ },
30
+ "optimizer": {
31
+ "type": "Adam",
32
+ "kwargs": {
33
+ "lr": 0.0003,
34
+ "betas": [
35
+ 0.9,
36
+ 0.98
37
+ ],
38
+ "weight_decay": 1e-06
39
+ }
40
+ }
41
+ }
42
+ }
hyper-p.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "data": {
3
+ "dev": [
4
+ "dev_en_mul",
5
+ "dev_es_mul",
6
+ "dev_fr_mul",
7
+ "dev_it_mul",
8
+ "dev_ky_mul",
9
+ "dev_ru_mul",
10
+ "dev_nl_mul",
11
+ "dev_tt_mul",
12
+ "dev_tr_mul",
13
+ "dev_sv-SE_mul"
14
+ ],
15
+ "test": [
16
+ "test_en_mul",
17
+ "test_es_mul",
18
+ "test_fr_mul",
19
+ "test_it_mul",
20
+ "test_ky_mul",
21
+ "test_ru_mul",
22
+ "test_nl_mul",
23
+ "test_tt_mul",
24
+ "test_tr_mul",
25
+ "test_sv-SE_mul"
26
+ ],
27
+ "filter": "10:1200"
28
+ },
29
+ "tokenizer": {
30
+ "type": "LexiconTokenizer",
31
+ "option-init": {
32
+ "lexicon": "dict/ten/lexicon_mul10.txt"
33
+ },
34
+ "file": "dict/ten/tokenizer_mul10.tknz",
35
+ "|V|": 75
36
+ },
37
+ "env": {
38
+ "CUDA_VISIBLE_DEVICES": "0,1,2,3,4,5,6,7,8,9"
39
+ },
40
+ "train": {
41
+ "bin": "cat.ctc.train",
42
+ "option": {
43
+ "amp": true,
44
+ "batch_size": 320,
45
+ "grad_norm": 5.0,
46
+ "grad_accum_fold": 2,
47
+ "check_freq": 500,
48
+ "large-dataset": true,
49
+ "ld": "data/*/{11_1000,1001_1200}/*.tar"
50
+ }
51
+ },
52
+ "inference": {
53
+ "avgmodel": {
54
+ "mode": "best",
55
+ "num": 3
56
+ },
57
+ "infer": {
58
+ "bin": "cat.ctc.decode",
59
+ "option": {
60
+ "beam_size": 16,
61
+ "nj": 16,
62
+ "store_ark": true
63
+ }
64
+ },
65
+ "er": {
66
+ "per": true
67
+ }
68
+ },
69
+ "commit": "1b77bc21f7a5faac5e47f6bc4445f23ebf0e0633"
70
+ }
lexicon_mul10.txt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae10e0c8cc66da6ae110745601977e2a46afdb4d398246f4884e2922429a8d22
3
+ size 21985313
tokenizer_mul10.tknz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be8c9593ae6afc772067554022481c53dc5ea2cd889d1036e992bb02c493130
3
+ size 24304800