Tiance Wang
committed on
Commit
·
dd8f83d
1
Parent(s):
2e07765
upload decode results and train logs
Browse files
- data/lang_phone/lexicon.txt +0 -0
- data/lang_phone/lexicon_disambig.txt +0 -0
- data/lang_phone/tokens.txt +88 -0
- data/lang_phone/words.txt +0 -0
- decoding-results/nbest-oracle/errs-test-clean-oracle_50_nbest_scale_1.0.txt +0 -0
- decoding-results/nbest-oracle/errs-test-other-oracle_50_nbest_scale_1.0.txt +0 -0
- decoding-results/nbest-oracle/log-decode-2022-08-16-19-07-58 +29 -0
- decoding-results/nbest-oracle/recogs-test-clean-oracle_50_nbest_scale_1.0.txt +0 -0
- decoding-results/nbest-oracle/recogs-test-other-oracle_50_nbest_scale_1.0.txt +0 -0
- decoding-results/nbest-rescoring/errs-test-clean-lm_scale_0.7.txt +0 -0
- decoding-results/nbest-rescoring/errs-test-other-lm_scale_0.7.txt +0 -0
- decoding-results/nbest-rescoring/log-decode-2022-08-16-18-58-48 +78 -0
- decoding-results/nbest-rescoring/recogs-test-clean-lm_scale_0.7.txt +0 -0
- decoding-results/nbest-rescoring/recogs-test-other-lm_scale_0.7.txt +0 -0
- decoding-results/one-best/errs-test-clean-no_rescore.txt +0 -0
- decoding-results/one-best/errs-test-other-no_rescore.txt +0 -0
- decoding-results/one-best/log-decode-2022-08-16-18-55-20 +29 -0
- decoding-results/one-best/recogs-test-clean-no_rescore.txt +0 -0
- decoding-results/one-best/recogs-test-other-no_rescore.txt +0 -0
- decoding-results/whole-lattice-rescoring/errs-test-clean-lm_scale_0.8.txt +0 -0
- decoding-results/whole-lattice-rescoring/errs-test-other-lm_scale_0.8.txt +0 -0
- decoding-results/whole-lattice-rescoring/log-decode-2022-08-16-19-11-22 +0 -0
- decoding-results/whole-lattice-rescoring/recogs-test-clean-lm_scale_0.8.txt +0 -0
- decoding-results/whole-lattice-rescoring/recogs-test-other-lm_scale_0.8.txt +0 -0
- tensorboard_log/events.out.tfevents.1659925381.dgxs-01.cluster.thspzh.com.18736.0 +3 -0
- tensorboard_log/events.out.tfevents.1659926695.dgxs-01.cluster.thspzh.com.27410.0 +3 -0
- tensorboard_log/events.out.tfevents.1659927762.dgxs-01.cluster.thspzh.com.34561.0 +3 -0
- tensorboard_log/events.out.tfevents.1659928526.dgxs-01.cluster.thspzh.com.39902.0 +3 -0
- tensorboard_log/events.out.tfevents.1659929206.dgxs-01.cluster.thspzh.com.4352.0 +3 -0
- tensorboard_log/events.out.tfevents.1659930110.dgxs-01.cluster.thspzh.com.10312.0 +3 -0
- tensorboard_log/events.out.tfevents.1659931044.dgxs-01.cluster.thspzh.com.16831.0 +3 -0
- tensorboard_log/events.out.tfevents.1659940194.dgxs-01.cluster.thspzh.com.37638.0 +3 -0
- tensorboard_log/events.out.tfevents.1659941396.dgxs-01.cluster.thspzh.com.5637.0 +3 -0
- tensorboard_log/events.out.tfevents.1660034714.dgxs-01.cluster.thspzh.com.3516.0 +3 -0
- tensorboard_log/events.out.tfevents.1660179164.dgxs-01.cluster.thspzh.com.14444.0 +3 -0
- tensorboard_log/events.out.tfevents.1660215232.dgxs-01.cluster.thspzh.com.3323.0 +3 -0
data/lang_phone/lexicon.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
data/lang_phone/lexicon_disambig.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
data/lang_phone/tokens.txt
ADDED
|
@@ -0,0 +1,88 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
<eps> 0
|
| 2 |
+
AA0 1
|
| 3 |
+
AA1 2
|
| 4 |
+
AA2 3
|
| 5 |
+
AE0 4
|
| 6 |
+
AE1 5
|
| 7 |
+
AE2 6
|
| 8 |
+
AH0 7
|
| 9 |
+
AH1 8
|
| 10 |
+
AH2 9
|
| 11 |
+
AO0 10
|
| 12 |
+
AO1 11
|
| 13 |
+
AO2 12
|
| 14 |
+
AW0 13
|
| 15 |
+
AW1 14
|
| 16 |
+
AW2 15
|
| 17 |
+
AY0 16
|
| 18 |
+
AY1 17
|
| 19 |
+
AY2 18
|
| 20 |
+
B 19
|
| 21 |
+
CH 20
|
| 22 |
+
D 21
|
| 23 |
+
DH 22
|
| 24 |
+
EH0 23
|
| 25 |
+
EH1 24
|
| 26 |
+
EH2 25
|
| 27 |
+
ER0 26
|
| 28 |
+
ER1 27
|
| 29 |
+
ER2 28
|
| 30 |
+
EY0 29
|
| 31 |
+
EY1 30
|
| 32 |
+
EY2 31
|
| 33 |
+
F 32
|
| 34 |
+
G 33
|
| 35 |
+
HH 34
|
| 36 |
+
IH0 35
|
| 37 |
+
IH1 36
|
| 38 |
+
IH2 37
|
| 39 |
+
IY0 38
|
| 40 |
+
IY1 39
|
| 41 |
+
IY2 40
|
| 42 |
+
JH 41
|
| 43 |
+
K 42
|
| 44 |
+
L 43
|
| 45 |
+
M 44
|
| 46 |
+
N 45
|
| 47 |
+
NG 46
|
| 48 |
+
OW0 47
|
| 49 |
+
OW1 48
|
| 50 |
+
OW2 49
|
| 51 |
+
OY0 50
|
| 52 |
+
OY1 51
|
| 53 |
+
OY2 52
|
| 54 |
+
P 53
|
| 55 |
+
R 54
|
| 56 |
+
S 55
|
| 57 |
+
SH 56
|
| 58 |
+
SIL 57
|
| 59 |
+
SPN 58
|
| 60 |
+
T 59
|
| 61 |
+
TH 60
|
| 62 |
+
UH0 61
|
| 63 |
+
UH1 62
|
| 64 |
+
UH2 63
|
| 65 |
+
UW0 64
|
| 66 |
+
UW1 65
|
| 67 |
+
UW2 66
|
| 68 |
+
V 67
|
| 69 |
+
W 68
|
| 70 |
+
Y 69
|
| 71 |
+
Z 70
|
| 72 |
+
ZH 71
|
| 73 |
+
#0 72
|
| 74 |
+
#1 73
|
| 75 |
+
#2 74
|
| 76 |
+
#3 75
|
| 77 |
+
#4 76
|
| 78 |
+
#5 77
|
| 79 |
+
#6 78
|
| 80 |
+
#7 79
|
| 81 |
+
#8 80
|
| 82 |
+
#9 81
|
| 83 |
+
#10 82
|
| 84 |
+
#11 83
|
| 85 |
+
#12 84
|
| 86 |
+
#13 85
|
| 87 |
+
#14 86
|
| 88 |
+
#15 87
|
data/lang_phone/words.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-oracle/errs-test-clean-oracle_50_nbest_scale_1.0.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-oracle/errs-test-other-oracle_50_nbest_scale_1.0.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-oracle/log-decode-2022-08-16-19-07-58
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2022-08-16 19:07:58,178 INFO [decode.py:579] Decoding started
|
| 2 |
+
2022-08-16 19:07:58,178 INFO [decode.py:580] {'subsampling_factor': 4, 'feature_dim': 80, 'search_beam': 20, 'output_beam': 8, 'min_active_states': 30, 'max_active_states': 10000, 'use_double_scores': True, 'env_info': {'k2-version': '1.18', 'k2-build-type': 'Release', 'k2-with-cuda': True, 'k2-git-sha1': '2d82a1d9350263ae48a6953034ce570e3d5208c1', 'k2-git-date': 'Mon Aug 15 02:09:05 2022', 'lhotse-version': '1.4.0.dev+git.94e9ed9.clean', 'torch-version': '1.11.0', 'torch-cuda-available': True, 'torch-cuda-version': '11.3', 'python-version': '3.8', 'icefall-git-branch': 'lightweight', 'icefall-git-sha1': 'eb99d97-dirty', 'icefall-git-date': 'Tue Aug 16 16:04:39 2022', 'icefall-path': '/thspfs/home/acct-hpc/thspzh-hpc1/git/icefall_dev', 'k2-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/k2/__init__.py', 'lhotse-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/lhotse/__init__.py', 'hostname': 'dgx-04.cluster.thspzh.com', 'IP address': '192.168.200.39'}, 'epoch': 9999, 'iter': 0, 'avg': 1, 'method': 'nbest-oracle', 'use_averaged_model': False, 'num_paths': 50, 'nbest_scale': 1.0, 'exp_dir': PosixPath('lightweight_ctc/exp_phone'), 'lang_dir': PosixPath('data/lang_phone'), 'lm_dir': PosixPath('data/lm'), 'first_out_channels': 8, 'conv_blocks': 3, 'rnn_dim': 0, 'full_libri': True, 'manifest_dir': PosixPath('data/fbank'), 'max_duration': 100, 'bucketing_sampler': True, 'num_buckets': 30, 'concatenate_cuts': False, 'duration_factor': 1.0, 'gap': 1.0, 'on_the_fly_feats': False, 'shuffle': True, 'drop_last': True, 'return_cuts': True, 'num_workers': 2, 'enable_spec_aug': True, 'spec_aug_time_warp_factor': 80, 'enable_musan': True, 'input_strategy': 'PrecomputedFeatures'}
|
| 3 |
+
2022-08-16 19:07:58,434 INFO [lexicon.py:176] Loading pre-compiled data/lang_phone/Linv.pt
|
| 4 |
+
2022-08-16 19:07:58,784 INFO [decode.py:590] device: cuda:0
|
| 5 |
+
2022-08-16 19:08:28,989 INFO [checkpoint.py:112] Loading checkpoint from lightweight_ctc/exp_phone/epoch-9999.pt
|
| 6 |
+
2022-08-16 19:08:29,243 INFO [decode.py:752] Number of model parameters: 1766904
|
| 7 |
+
2022-08-16 19:08:29,243 INFO [asr_datamodule.py:444] About to get test-clean cuts
|
| 8 |
+
2022-08-16 19:08:29,287 INFO [asr_datamodule.py:451] About to get test-other cuts
|
| 9 |
+
2022-08-16 19:08:31,771 INFO [decode.py:513] batch 0/?, cuts processed until now is 7
|
| 10 |
+
2022-08-16 19:08:46,365 INFO [decode.py:513] batch 100/?, cuts processed until now is 1218
|
| 11 |
+
2022-08-16 19:09:05,621 INFO [decode.py:513] batch 200/?, cuts processed until now is 2525
|
| 12 |
+
2022-08-16 19:09:06,722 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-oracle/recogs-test-clean-oracle_50_nbest_scale_1.0.txt
|
| 13 |
+
2022-08-16 19:09:06,777 INFO [utils.py:428] [test-clean-oracle_50_nbest_scale_1.0] %WER 5.87% [3085 / 52576, 129 ins, 824 del, 2132 sub ]
|
| 14 |
+
2022-08-16 19:09:06,922 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-oracle/errs-test-clean-oracle_50_nbest_scale_1.0.txt
|
| 15 |
+
2022-08-16 19:09:06,924 INFO [decode.py:563]
|
| 16 |
+
For test-clean, WER of different settings are:
|
| 17 |
+
oracle_50_nbest_scale_1.0 5.87 best for test-clean
|
| 18 |
+
|
| 19 |
+
2022-08-16 19:09:07,703 INFO [decode.py:513] batch 0/?, cuts processed until now is 9
|
| 20 |
+
2022-08-16 19:09:28,819 INFO [decode.py:513] batch 100/?, cuts processed until now is 1400
|
| 21 |
+
2022-08-16 19:09:54,731 INFO [decode.py:513] batch 200/?, cuts processed until now is 2898
|
| 22 |
+
2022-08-16 19:09:55,424 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-oracle/recogs-test-other-oracle_50_nbest_scale_1.0.txt
|
| 23 |
+
2022-08-16 19:09:55,484 INFO [utils.py:428] [test-other-oracle_50_nbest_scale_1.0] %WER 19.32% [10113 / 52343, 229 ins, 3803 del, 6081 sub ]
|
| 24 |
+
2022-08-16 19:09:55,636 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-oracle/errs-test-other-oracle_50_nbest_scale_1.0.txt
|
| 25 |
+
2022-08-16 19:09:55,639 INFO [decode.py:563]
|
| 26 |
+
For test-other, WER of different settings are:
|
| 27 |
+
oracle_50_nbest_scale_1.0 19.32 best for test-other
|
| 28 |
+
|
| 29 |
+
2022-08-16 19:09:55,639 INFO [decode.py:783] Done!
|
decoding-results/nbest-oracle/recogs-test-clean-oracle_50_nbest_scale_1.0.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-oracle/recogs-test-other-oracle_50_nbest_scale_1.0.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-rescoring/errs-test-clean-lm_scale_0.7.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-rescoring/errs-test-other-lm_scale_0.7.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-rescoring/log-decode-2022-08-16-18-58-48
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2022-08-16 18:58:48,677 INFO [decode.py:579] Decoding started
|
| 2 |
+
2022-08-16 18:58:48,677 INFO [decode.py:580] {'subsampling_factor': 4, 'feature_dim': 80, 'search_beam': 20, 'output_beam': 8, 'min_active_states': 30, 'max_active_states': 10000, 'use_double_scores': True, 'env_info': {'k2-version': '1.18', 'k2-build-type': 'Release', 'k2-with-cuda': True, 'k2-git-sha1': '2d82a1d9350263ae48a6953034ce570e3d5208c1', 'k2-git-date': 'Mon Aug 15 02:09:05 2022', 'lhotse-version': '1.4.0.dev+git.94e9ed9.clean', 'torch-version': '1.11.0', 'torch-cuda-available': True, 'torch-cuda-version': '11.3', 'python-version': '3.8', 'icefall-git-branch': 'lightweight', 'icefall-git-sha1': 'eb99d97-dirty', 'icefall-git-date': 'Tue Aug 16 16:04:39 2022', 'icefall-path': '/thspfs/home/acct-hpc/thspzh-hpc1/git/icefall_dev', 'k2-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/k2/__init__.py', 'lhotse-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/lhotse/__init__.py', 'hostname': 'dgx-04.cluster.thspzh.com', 'IP address': '192.168.200.39'}, 'epoch': 9999, 'iter': 0, 'avg': 1, 'method': 'nbest-rescoring', 'use_averaged_model': False, 'num_paths': 50, 'nbest_scale': 1.0, 'exp_dir': PosixPath('lightweight_ctc/exp_phone'), 'lang_dir': PosixPath('data/lang_phone'), 'lm_dir': PosixPath('data/lm'), 'first_out_channels': 8, 'conv_blocks': 3, 'rnn_dim': 0, 'full_libri': True, 'manifest_dir': PosixPath('data/fbank'), 'max_duration': 100, 'bucketing_sampler': True, 'num_buckets': 30, 'concatenate_cuts': False, 'duration_factor': 1.0, 'gap': 1.0, 'on_the_fly_feats': False, 'shuffle': True, 'drop_last': True, 'return_cuts': True, 'num_workers': 2, 'enable_spec_aug': True, 'spec_aug_time_warp_factor': 80, 'enable_musan': True, 'input_strategy': 'PrecomputedFeatures'}
|
| 3 |
+
2022-08-16 18:58:48,943 INFO [lexicon.py:176] Loading pre-compiled data/lang_phone/Linv.pt
|
| 4 |
+
2022-08-16 18:58:49,343 INFO [decode.py:590] device: cuda:0
|
| 5 |
+
2022-08-16 18:59:16,887 INFO [decode.py:642] Loading pre-compiled G_4_gram.pt
|
| 6 |
+
2022-08-16 18:59:50,447 INFO [checkpoint.py:112] Loading checkpoint from lightweight_ctc/exp_phone/epoch-9999.pt
|
| 7 |
+
2022-08-16 18:59:50,632 INFO [decode.py:752] Number of model parameters: 1766904
|
| 8 |
+
2022-08-16 18:59:50,632 INFO [asr_datamodule.py:444] About to get test-clean cuts
|
| 9 |
+
2022-08-16 18:59:50,665 INFO [asr_datamodule.py:451] About to get test-other cuts
|
| 10 |
+
2022-08-16 18:59:53,411 INFO [decode.py:513] batch 0/?, cuts processed until now is 7
|
| 11 |
+
2022-08-16 19:00:50,654 INFO [decode.py:513] batch 100/?, cuts processed until now is 1218
|
| 12 |
+
2022-08-16 19:01:51,594 INFO [decode.py:513] batch 200/?, cuts processed until now is 2525
|
| 13 |
+
2022-08-16 19:01:55,309 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_0.5.txt
|
| 14 |
+
2022-08-16 19:01:55,368 INFO [utils.py:428] [test-clean-lm_scale_0.5] %WER 9.11% [4789 / 52576, 513 ins, 754 del, 3522 sub ]
|
| 15 |
+
2022-08-16 19:01:55,592 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_0.5.txt
|
| 16 |
+
2022-08-16 19:01:55,629 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_0.6.txt
|
| 17 |
+
2022-08-16 19:01:55,685 INFO [utils.py:428] [test-clean-lm_scale_0.6] %WER 8.87% [4665 / 52576, 474 ins, 788 del, 3403 sub ]
|
| 18 |
+
2022-08-16 19:01:55,832 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_0.6.txt
|
| 19 |
+
2022-08-16 19:01:55,860 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_0.7.txt
|
| 20 |
+
2022-08-16 19:01:55,915 INFO [utils.py:428] [test-clean-lm_scale_0.7] %WER 8.78% [4617 / 52576, 441 ins, 834 del, 3342 sub ]
|
| 21 |
+
2022-08-16 19:01:56,061 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_0.7.txt
|
| 22 |
+
2022-08-16 19:01:56,089 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_0.8.txt
|
| 23 |
+
2022-08-16 19:01:56,143 INFO [utils.py:428] [test-clean-lm_scale_0.8] %WER 8.83% [4642 / 52576, 415 ins, 920 del, 3307 sub ]
|
| 24 |
+
2022-08-16 19:01:56,290 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_0.8.txt
|
| 25 |
+
2022-08-16 19:01:56,318 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_0.9.txt
|
| 26 |
+
2022-08-16 19:01:56,374 INFO [utils.py:428] [test-clean-lm_scale_0.9] %WER 8.88% [4667 / 52576, 382 ins, 1001 del, 3284 sub ]
|
| 27 |
+
2022-08-16 19:01:56,518 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_0.9.txt
|
| 28 |
+
2022-08-16 19:01:56,545 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_1.0.txt
|
| 29 |
+
2022-08-16 19:01:56,599 INFO [utils.py:428] [test-clean-lm_scale_1.0] %WER 9.02% [4741 / 52576, 352 ins, 1103 del, 3286 sub ]
|
| 30 |
+
2022-08-16 19:01:56,809 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_1.0.txt
|
| 31 |
+
2022-08-16 19:01:56,839 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-clean-lm_scale_1.1.txt
|
| 32 |
+
2022-08-16 19:01:56,896 INFO [utils.py:428] [test-clean-lm_scale_1.1] %WER 9.26% [4869 / 52576, 337 ins, 1194 del, 3338 sub ]
|
| 33 |
+
2022-08-16 19:01:57,046 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-clean-lm_scale_1.1.txt
|
| 34 |
+
2022-08-16 19:01:57,053 INFO [decode.py:563]
|
| 35 |
+
For test-clean, WER of different settings are:
|
| 36 |
+
lm_scale_0.7 8.78 best for test-clean
|
| 37 |
+
lm_scale_0.8 8.83
|
| 38 |
+
lm_scale_0.6 8.87
|
| 39 |
+
lm_scale_0.9 8.88
|
| 40 |
+
lm_scale_1.0 9.02
|
| 41 |
+
lm_scale_0.5 9.11
|
| 42 |
+
lm_scale_1.1 9.26
|
| 43 |
+
|
| 44 |
+
2022-08-16 19:01:59,299 INFO [decode.py:513] batch 0/?, cuts processed until now is 9
|
| 45 |
+
2022-08-16 19:03:57,721 INFO [decode.py:513] batch 100/?, cuts processed until now is 1400
|
| 46 |
+
2022-08-16 19:05:52,745 INFO [decode.py:513] batch 200/?, cuts processed until now is 2898
|
| 47 |
+
2022-08-16 19:05:56,000 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_0.5.txt
|
| 48 |
+
2022-08-16 19:05:56,066 INFO [utils.py:428] [test-other-lm_scale_0.5] %WER 25.46% [13328 / 52343, 817 ins, 3576 del, 8935 sub ]
|
| 49 |
+
2022-08-16 19:05:56,232 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_0.5.txt
|
| 50 |
+
2022-08-16 19:05:56,261 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_0.6.txt
|
| 51 |
+
2022-08-16 19:05:56,322 INFO [utils.py:428] [test-other-lm_scale_0.6] %WER 25.15% [13162 / 52343, 761 ins, 3712 del, 8689 sub ]
|
| 52 |
+
2022-08-16 19:05:56,488 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_0.6.txt
|
| 53 |
+
2022-08-16 19:05:56,516 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_0.7.txt
|
| 54 |
+
2022-08-16 19:05:56,575 INFO [utils.py:428] [test-other-lm_scale_0.7] %WER 24.94% [13053 / 52343, 704 ins, 3901 del, 8448 sub ]
|
| 55 |
+
2022-08-16 19:05:56,739 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_0.7.txt
|
| 56 |
+
2022-08-16 19:05:56,768 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_0.8.txt
|
| 57 |
+
2022-08-16 19:05:56,894 INFO [utils.py:428] [test-other-lm_scale_0.8] %WER 24.97% [13072 / 52343, 643 ins, 4155 del, 8274 sub ]
|
| 58 |
+
2022-08-16 19:05:57,055 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_0.8.txt
|
| 59 |
+
2022-08-16 19:05:57,083 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_0.9.txt
|
| 60 |
+
2022-08-16 19:05:57,141 INFO [utils.py:428] [test-other-lm_scale_0.9] %WER 25.14% [13159 / 52343, 589 ins, 4405 del, 8165 sub ]
|
| 61 |
+
2022-08-16 19:05:57,302 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_0.9.txt
|
| 62 |
+
2022-08-16 19:05:57,333 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_1.0.txt
|
| 63 |
+
2022-08-16 19:05:57,391 INFO [utils.py:428] [test-other-lm_scale_1.0] %WER 25.40% [13294 / 52343, 548 ins, 4655 del, 8091 sub ]
|
| 64 |
+
2022-08-16 19:05:57,551 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_1.0.txt
|
| 65 |
+
2022-08-16 19:05:57,579 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-nbest-rescoring/recogs-test-other-lm_scale_1.1.txt
|
| 66 |
+
2022-08-16 19:05:57,638 INFO [utils.py:428] [test-other-lm_scale_1.1] %WER 25.62% [13411 / 52343, 496 ins, 4910 del, 8005 sub ]
|
| 67 |
+
2022-08-16 19:05:57,864 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-nbest-rescoring/errs-test-other-lm_scale_1.1.txt
|
| 68 |
+
2022-08-16 19:05:57,868 INFO [decode.py:563]
|
| 69 |
+
For test-other, WER of different settings are:
|
| 70 |
+
lm_scale_0.7 24.94 best for test-other
|
| 71 |
+
lm_scale_0.8 24.97
|
| 72 |
+
lm_scale_0.9 25.14
|
| 73 |
+
lm_scale_0.6 25.15
|
| 74 |
+
lm_scale_1.0 25.4
|
| 75 |
+
lm_scale_0.5 25.46
|
| 76 |
+
lm_scale_1.1 25.62
|
| 77 |
+
|
| 78 |
+
2022-08-16 19:05:57,868 INFO [decode.py:783] Done!
|
decoding-results/nbest-rescoring/recogs-test-clean-lm_scale_0.7.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/nbest-rescoring/recogs-test-other-lm_scale_0.7.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/one-best/errs-test-clean-no_rescore.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/one-best/errs-test-other-no_rescore.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/one-best/log-decode-2022-08-16-18-55-20
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2022-08-16 18:55:20,583 INFO [decode.py:579] Decoding started
|
| 2 |
+
2022-08-16 18:55:20,583 INFO [decode.py:580] {'subsampling_factor': 4, 'feature_dim': 80, 'search_beam': 20, 'output_beam': 8, 'min_active_states': 30, 'max_active_states': 10000, 'use_double_scores': True, 'env_info': {'k2-version': '1.18', 'k2-build-type': 'Release', 'k2-with-cuda': True, 'k2-git-sha1': '2d82a1d9350263ae48a6953034ce570e3d5208c1', 'k2-git-date': 'Mon Aug 15 02:09:05 2022', 'lhotse-version': '1.4.0.dev+git.94e9ed9.clean', 'torch-version': '1.11.0', 'torch-cuda-available': True, 'torch-cuda-version': '11.3', 'python-version': '3.8', 'icefall-git-branch': 'lightweight', 'icefall-git-sha1': 'eb99d97-dirty', 'icefall-git-date': 'Tue Aug 16 16:04:39 2022', 'icefall-path': '/thspfs/home/acct-hpc/thspzh-hpc1/git/icefall_dev', 'k2-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/k2/__init__.py', 'lhotse-path': '/raid/conda/envs/k2a100/lib/python3.8/site-packages/lhotse/__init__.py', 'hostname': 'dgx-04.cluster.thspzh.com', 'IP address': '192.168.200.39'}, 'epoch': 9999, 'iter': 0, 'avg': 1, 'method': '1best', 'use_averaged_model': False, 'num_paths': 50, 'nbest_scale': 1.0, 'exp_dir': PosixPath('lightweight_ctc/exp_phone'), 'lang_dir': PosixPath('data/lang_phone'), 'lm_dir': PosixPath('data/lm'), 'first_out_channels': 8, 'conv_blocks': 3, 'rnn_dim': 0, 'full_libri': True, 'manifest_dir': PosixPath('data/fbank'), 'max_duration': 100, 'bucketing_sampler': True, 'num_buckets': 30, 'concatenate_cuts': False, 'duration_factor': 1.0, 'gap': 1.0, 'on_the_fly_feats': False, 'shuffle': True, 'drop_last': True, 'return_cuts': True, 'num_workers': 2, 'enable_spec_aug': True, 'spec_aug_time_warp_factor': 80, 'enable_musan': True, 'input_strategy': 'PrecomputedFeatures'}
|
| 3 |
+
2022-08-16 18:55:20,838 INFO [lexicon.py:176] Loading pre-compiled data/lang_phone/Linv.pt
|
| 4 |
+
2022-08-16 18:55:21,200 INFO [decode.py:590] device: cuda:0
|
| 5 |
+
2022-08-16 18:55:47,461 INFO [checkpoint.py:112] Loading checkpoint from lightweight_ctc/exp_phone/epoch-9999.pt
|
| 6 |
+
2022-08-16 18:55:47,774 INFO [decode.py:752] Number of model parameters: 1766904
|
| 7 |
+
2022-08-16 18:55:47,774 INFO [asr_datamodule.py:444] About to get test-clean cuts
|
| 8 |
+
2022-08-16 18:55:47,808 INFO [asr_datamodule.py:451] About to get test-other cuts
|
| 9 |
+
2022-08-16 18:55:50,321 INFO [decode.py:513] batch 0/?, cuts processed until now is 7
|
| 10 |
+
2022-08-16 18:56:07,871 INFO [decode.py:513] batch 100/?, cuts processed until now is 1218
|
| 11 |
+
2022-08-16 18:56:22,985 INFO [decode.py:513] batch 200/?, cuts processed until now is 2525
|
| 12 |
+
2022-08-16 18:56:23,773 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-1best/recogs-test-clean-no_rescore.txt
|
| 13 |
+
2022-08-16 18:56:23,829 INFO [utils.py:428] [test-clean-no_rescore] %WER 11.10% [5836 / 52576, 298 ins, 1670 del, 3868 sub ]
|
| 14 |
+
2022-08-16 18:56:23,979 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-1best/errs-test-clean-no_rescore.txt
|
| 15 |
+
2022-08-16 18:56:23,985 INFO [decode.py:563]
|
| 16 |
+
For test-clean, WER of different settings are:
|
| 17 |
+
no_rescore 11.1 best for test-clean
|
| 18 |
+
|
| 19 |
+
2022-08-16 18:56:24,729 INFO [decode.py:513] batch 0/?, cuts processed until now is 9
|
| 20 |
+
2022-08-16 18:56:35,677 INFO [decode.py:513] batch 100/?, cuts processed until now is 1400
|
| 21 |
+
2022-08-16 18:56:46,220 INFO [decode.py:513] batch 200/?, cuts processed until now is 2898
|
| 22 |
+
2022-08-16 18:56:46,748 INFO [decode.py:535] The transcripts are stored in lightweight_ctc/exp_phone/decode-1best/recogs-test-other-no_rescore.txt
|
| 23 |
+
2022-08-16 18:56:46,808 INFO [utils.py:428] [test-other-no_rescore] %WER 28.49% [14915 / 52343, 432 ins, 5911 del, 8572 sub ]
|
| 24 |
+
2022-08-16 18:56:46,972 INFO [decode.py:547] Wrote detailed error stats to lightweight_ctc/exp_phone/decode-1best/errs-test-other-no_rescore.txt
|
| 25 |
+
2022-08-16 18:56:46,975 INFO [decode.py:563]
|
| 26 |
+
For test-other, WER of different settings are:
|
| 27 |
+
no_rescore 28.49 best for test-other
|
| 28 |
+
|
| 29 |
+
2022-08-16 18:56:46,975 INFO [decode.py:783] Done!
|
decoding-results/one-best/recogs-test-clean-no_rescore.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/one-best/recogs-test-other-no_rescore.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/whole-lattice-rescoring/errs-test-clean-lm_scale_0.8.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/whole-lattice-rescoring/errs-test-other-lm_scale_0.8.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/whole-lattice-rescoring/log-decode-2022-08-16-19-11-22
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/whole-lattice-rescoring/recogs-test-clean-lm_scale_0.8.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
decoding-results/whole-lattice-rescoring/recogs-test-other-lm_scale_0.8.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tensorboard_log/events.out.tfevents.1659925381.dgxs-01.cluster.thspzh.com.18736.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9dd26f857f5b14ce7ec6e593deb589ac9185301052d1abe4e9f4d907752db206
|
| 3 |
+
size 16422
|
tensorboard_log/events.out.tfevents.1659926695.dgxs-01.cluster.thspzh.com.27410.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a7eb0172864cee90bf56d7dcce1dfa4acfd1a9ed7dd925c59c1127ec0ecb7a2
|
| 3 |
+
size 16422
|
tensorboard_log/events.out.tfevents.1659927762.dgxs-01.cluster.thspzh.com.34561.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:11f12dd44388e3d06bcebf44335a6f306bfd8630ee1e7757190256536aa6df36
|
| 3 |
+
size 16422
|
tensorboard_log/events.out.tfevents.1659928526.dgxs-01.cluster.thspzh.com.39902.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec03256c2ae37aafacc51bc6488819ec542ef73d8c49d807eade3c5b9be4ba86
|
| 3 |
+
size 16422
|
tensorboard_log/events.out.tfevents.1659929206.dgxs-01.cluster.thspzh.com.4352.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d88a6ad0c29daca178985d8f0c249e567ebd0b11d351521300fd096282541b8e
|
| 3 |
+
size 16422
|
tensorboard_log/events.out.tfevents.1659930110.dgxs-01.cluster.thspzh.com.10312.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e48d0b5cb56393b681d93ee056d31be884315089e9f1b7ebc4b902692df80244
|
| 3 |
+
size 129066
|
tensorboard_log/events.out.tfevents.1659931044.dgxs-01.cluster.thspzh.com.16831.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f516811d43fe0e65156d15f43a99282f428439962ec18be3062d63368ba16ba
|
| 3 |
+
size 8613
|
tensorboard_log/events.out.tfevents.1659940194.dgxs-01.cluster.thspzh.com.37638.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79cff4276e624b7469a0bf61f1c9288e999d004c5d0de765c63924e7ed6cd263
|
| 3 |
+
size 3496
|
tensorboard_log/events.out.tfevents.1659941396.dgxs-01.cluster.thspzh.com.5637.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0509af9d9019f0c39e9927e68abbb68dbe9a5424c63a0e27ce7f0e0998626e27
|
| 3 |
+
size 558835
|
tensorboard_log/events.out.tfevents.1660034714.dgxs-01.cluster.thspzh.com.3516.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:54b016c9191ca208a2bf031f1b2e86f8488e85ae16a4468b91b496981fd75fc8
|
| 3 |
+
size 55828
|
tensorboard_log/events.out.tfevents.1660179164.dgxs-01.cluster.thspzh.com.14444.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b2d4e8624825a46d412df077f54e24ce043d7fbfa1a3b7c9f8380dd8d1270540
|
| 3 |
+
size 83916
|
tensorboard_log/events.out.tfevents.1660215232.dgxs-01.cluster.thspzh.com.3323.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba6ee1e1a8108e0a0680217955df8a49fef28ff72c286bf30feb66edcfe2fad0
|
| 3 |
+
size 111126
|