longdnk committed on
Commit
59d5990
·
verified ·
1 Parent(s): 396d73a

Upload 12 files

Browse files
config.json CHANGED
@@ -78,7 +78,7 @@
78
  "num_hidden_layers": 24,
79
  "num_negatives": 100,
80
  "output_hidden_size": 1024,
81
- "pad_token_id": 0,
82
  "proj_codevector_dim": 768,
83
  "tdnn_dilation": [
84
  1,
@@ -104,7 +104,7 @@
104
  "torch_dtype": "float32",
105
  "transformers_version": "4.44.2",
106
  "use_weighted_layer_sum": false,
107
- "vocab_size": 706,
108
  "xvector_output_dim": 512,
109
  "gradient_checkpointing": true
110
  }
 
78
  "num_hidden_layers": 24,
79
  "num_negatives": 100,
80
  "output_hidden_size": 1024,
81
+ "pad_token_id": 109,
82
  "proj_codevector_dim": 768,
83
  "tdnn_dilation": [
84
  1,
 
104
  "torch_dtype": "float32",
105
  "transformers_version": "4.44.2",
106
  "use_weighted_layer_sum": false,
107
+ "vocab_size": 112,
108
  "xvector_output_dim": 512,
109
  "gradient_checkpointing": true
110
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:59d5168fc368c9867328200624f48cd61e0cd359dc8fa63f7cf6f52e524fa5cf
3
- size 1264702096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:968ba954eb81788a989a006204d06ca7d52d55927a7a86e47f20690a66079b19
3
+ size 1262266680
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e39159be60117a819e966813c4463e8cc047b65885df69f01d424fb2d06905f4
3
- size 2495948982
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b4d81a5b608612048bd9f92eecc1e4c742674dcd2cafe044c04431010ad5849
3
+ size 2491078198
preprocessor_config.json CHANGED
@@ -4,6 +4,6 @@
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
- "return_attention_mask": true,
8
  "sampling_rate": 16000
9
  }
 
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
+ "return_attention_mask": false,
8
  "sampling_rate": 16000
9
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f7fd1fbb51e7513603571774ca0fc7e59957d504c5d26890b5fb4d0c60d1ccb
3
- size 1264796970
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6652aafede63e06daaf7684c1ea4d8ead8cf0e968811c3c6abc1aa8ccfd2adc
3
+ size 1262361578
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea2014619ab560562b67af3ac493f171046c4761b85b6e9309d2e81fe852477e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:328397d773f82db3ef11fc5e40ca3a0bde89da51a612c1883347c8ebd80815ed
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4e35d7e4eefe7e8bb82e6ce1341473003d09c1f20b61a31153b813a7c9699bb
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0612c909f86715e3aa0b05de2507e957fdd12ee7b1a9ba818551018e1b0ab74
3
  size 1064
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "<pad>", "do_lower_case": true, "word_delimiter_token": "|", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "<pad>", "do_lower_case": false, "word_delimiter_token": "|", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
trainer_state.json CHANGED
@@ -1,298 +1,198 @@
1
  {
2
- "best_metric": 0.14590401947498322,
3
- "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-7000",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 7296,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.20559210526315788,
13
- "grad_norm": 3.5381269454956055,
14
- "learning_rate": 4.9800000000000004e-05,
15
- "loss": 0.1743,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.20559210526315788,
20
- "eval_cer": 0.034921636688755656,
21
- "eval_loss": 0.18684570491313934,
22
- "eval_mer": 0.2065967016491754,
23
- "eval_runtime": 67.8521,
24
- "eval_samples_per_second": 17.921,
25
- "eval_steps_per_second": 2.24,
26
- "eval_wer": 0.2089778586593873,
27
- "eval_wil": 0.3545466865428919,
28
- "eval_wip": 0.6454533134571081,
29
  "step": 500
30
  },
31
  {
32
  "epoch": 0.41118421052631576,
33
- "grad_norm": 6.306856632232666,
34
- "learning_rate": 4.6350794585050035e-05,
35
- "loss": 0.0802,
36
  "step": 1000
37
  },
38
  {
39
  "epoch": 0.41118421052631576,
40
- "eval_cer": 0.03683601556747659,
41
- "eval_loss": 0.1974627524614334,
42
- "eval_mer": 0.21781883194278903,
43
- "eval_runtime": 67.6807,
44
- "eval_samples_per_second": 17.967,
45
- "eval_steps_per_second": 2.246,
46
- "eval_wer": 0.22171671216257202,
47
- "eval_wil": 0.370112069660566,
48
- "eval_wip": 0.629887930339434,
49
  "step": 1000
50
  },
51
  {
52
  "epoch": 0.6167763157894737,
53
- "grad_norm": 2.544262170791626,
54
- "learning_rate": 4.267216009417305e-05,
55
- "loss": 0.0906,
56
  "step": 1500
57
  },
58
  {
59
  "epoch": 0.6167763157894737,
60
- "eval_cer": 0.0364152729567687,
61
- "eval_loss": 0.19286103546619415,
62
- "eval_mer": 0.21439325504366155,
63
- "eval_runtime": 68.1787,
64
- "eval_samples_per_second": 17.835,
65
- "eval_steps_per_second": 2.229,
66
- "eval_wer": 0.21595389748255991,
67
- "eval_wil": 0.3649436812657537,
68
- "eval_wip": 0.6350563187342463,
69
  "step": 1500
70
  },
71
  {
72
  "epoch": 0.8223684210526315,
73
- "grad_norm": 1.637362003326416,
74
- "learning_rate": 3.899352560329606e-05,
75
- "loss": 0.0906,
76
  "step": 2000
77
  },
78
  {
79
  "epoch": 0.8223684210526315,
80
- "eval_cer": 0.03565793625749448,
81
- "eval_loss": 0.1944369077682495,
82
- "eval_mer": 0.2094980462879471,
83
- "eval_runtime": 68.3994,
84
- "eval_samples_per_second": 17.778,
85
- "eval_steps_per_second": 2.222,
86
- "eval_wer": 0.21140430694570822,
87
- "eval_wil": 0.36077467429718857,
88
- "eval_wip": 0.6392253257028114,
89
  "step": 2000
90
  },
91
  {
92
  "epoch": 1.0279605263157894,
93
- "grad_norm": 3.4802608489990234,
94
- "learning_rate": 3.531489111241907e-05,
95
- "loss": 0.0985,
96
  "step": 2500
97
  },
98
  {
99
  "epoch": 1.0279605263157894,
100
- "eval_cer": 0.036352161565162515,
101
- "eval_loss": 0.19166675209999084,
102
- "eval_mer": 0.21280432822362488,
103
- "eval_runtime": 68.4199,
104
- "eval_samples_per_second": 17.773,
105
- "eval_steps_per_second": 2.222,
106
- "eval_wer": 0.21474067333939945,
107
- "eval_wil": 0.36261491061392714,
108
- "eval_wip": 0.6373850893860729,
109
  "step": 2500
110
  },
111
  {
112
  "epoch": 1.2335526315789473,
113
- "grad_norm": 0.283843457698822,
114
- "learning_rate": 3.164361389052384e-05,
115
- "loss": 0.1068,
116
  "step": 3000
117
  },
118
  {
119
  "epoch": 1.2335526315789473,
120
- "eval_cer": 0.03828757757441885,
121
- "eval_loss": 0.18938006460666656,
122
- "eval_mer": 0.21145770845830833,
123
- "eval_runtime": 68.2854,
124
- "eval_samples_per_second": 17.808,
125
- "eval_steps_per_second": 2.226,
126
- "eval_wer": 0.21383075523202913,
127
- "eval_wil": 0.3626201178125853,
128
- "eval_wip": 0.6373798821874147,
129
  "step": 3000
130
  },
131
  {
132
  "epoch": 1.4391447368421053,
133
- "grad_norm": 0.6021267175674438,
134
- "learning_rate": 2.796497939964685e-05,
135
- "loss": 0.1167,
136
  "step": 3500
137
  },
138
  {
139
  "epoch": 1.4391447368421053,
140
- "eval_cer": 0.03631008730409172,
141
- "eval_loss": 0.18041005730628967,
142
- "eval_mer": 0.2038369304556355,
143
- "eval_runtime": 68.6106,
144
- "eval_samples_per_second": 17.723,
145
- "eval_steps_per_second": 2.215,
146
- "eval_wer": 0.2062481043372763,
147
- "eval_wil": 0.3498563697078465,
148
- "eval_wip": 0.6501436302921535,
149
  "step": 3500
150
  },
151
  {
152
  "epoch": 1.6447368421052633,
153
- "grad_norm": 1.866600513458252,
154
- "learning_rate": 2.4286344908769864e-05,
155
- "loss": 0.1465,
156
  "step": 4000
157
  },
158
  {
159
  "epoch": 1.6447368421052633,
160
- "eval_cer": 0.035678973388029875,
161
- "eval_loss": 0.17490962147712708,
162
- "eval_mer": 0.21139430284857572,
163
- "eval_runtime": 68.4602,
164
- "eval_samples_per_second": 17.762,
165
- "eval_steps_per_second": 2.22,
166
- "eval_wer": 0.21383075523202913,
167
- "eval_wil": 0.361747028002243,
168
- "eval_wip": 0.638252971997757,
169
  "step": 4000
170
  },
171
  {
172
  "epoch": 1.850328947368421,
173
- "grad_norm": 3.364342451095581,
174
- "learning_rate": 2.060771041789288e-05,
175
- "loss": 0.1646,
176
  "step": 4500
177
  },
178
  {
179
  "epoch": 1.850328947368421,
180
- "eval_cer": 0.03382770590091511,
181
- "eval_loss": 0.16555456817150116,
182
- "eval_mer": 0.19957920048091374,
183
- "eval_runtime": 68.969,
184
- "eval_samples_per_second": 17.631,
185
- "eval_steps_per_second": 2.204,
186
- "eval_wer": 0.20139520776463452,
187
- "eval_wil": 0.3432318531535724,
188
- "eval_wip": 0.6567681468464276,
189
  "step": 4500
190
- },
191
- {
192
- "epoch": 2.0559210526315788,
193
- "grad_norm": 0.8766089081764221,
194
- "learning_rate": 1.6929075927015892e-05,
195
- "loss": 0.2085,
196
- "step": 5000
197
- },
198
- {
199
- "epoch": 2.0559210526315788,
200
- "eval_cer": 0.03254444093825602,
201
- "eval_loss": 0.16022680699825287,
202
- "eval_mer": 0.19477006311992787,
203
- "eval_runtime": 68.7751,
204
- "eval_samples_per_second": 17.681,
205
- "eval_steps_per_second": 2.21,
206
- "eval_wer": 0.19654231119199272,
207
- "eval_wil": 0.3361269123473307,
208
- "eval_wip": 0.6638730876526693,
209
- "step": 5000
210
- },
211
- {
212
- "epoch": 2.2615131578947367,
213
- "grad_norm": 1.846457839012146,
214
- "learning_rate": 1.3250441436138904e-05,
215
- "loss": 0.2251,
216
- "step": 5500
217
- },
218
- {
219
- "epoch": 2.2615131578947367,
220
- "eval_cer": 0.032081624066477334,
221
- "eval_loss": 0.15790578722953796,
222
- "eval_mer": 0.19153407385169618,
223
- "eval_runtime": 68.7932,
224
- "eval_samples_per_second": 17.676,
225
- "eval_steps_per_second": 2.21,
226
- "eval_wer": 0.1935092508340916,
227
- "eval_wil": 0.32998754348071724,
228
- "eval_wip": 0.6700124565192828,
229
- "step": 5500
230
- },
231
- {
232
- "epoch": 2.4671052631578947,
233
- "grad_norm": 2.029787302017212,
234
- "learning_rate": 9.579164214243673e-06,
235
- "loss": 0.2536,
236
- "step": 6000
237
- },
238
- {
239
- "epoch": 2.4671052631578947,
240
- "eval_cer": 0.03176606710844641,
241
- "eval_loss": 0.1529688686132431,
242
- "eval_mer": 0.1864864864864865,
243
- "eval_runtime": 68.9337,
244
- "eval_samples_per_second": 17.64,
245
- "eval_steps_per_second": 2.205,
246
- "eval_wer": 0.18835304822565968,
247
- "eval_wil": 0.3217957824380815,
248
- "eval_wip": 0.6782042175619185,
249
- "step": 6000
250
- },
251
- {
252
- "epoch": 2.6726973684210527,
253
- "grad_norm": 1.3223768472671509,
254
- "learning_rate": 5.9005297233666865e-06,
255
- "loss": 0.256,
256
- "step": 6500
257
- },
258
- {
259
- "epoch": 2.6726973684210527,
260
- "eval_cer": 0.03210266119701273,
261
- "eval_loss": 0.14946776628494263,
262
- "eval_mer": 0.18665464382326422,
263
- "eval_runtime": 69.3182,
264
- "eval_samples_per_second": 17.542,
265
- "eval_steps_per_second": 2.193,
266
- "eval_wer": 0.18835304822565968,
267
- "eval_wil": 0.3214362861329648,
268
- "eval_wip": 0.6785637138670352,
269
- "step": 6500
270
- },
271
- {
272
- "epoch": 2.8782894736842106,
273
- "grad_norm": 1.6771504878997803,
274
- "learning_rate": 2.2218952324896997e-06,
275
- "loss": 0.2895,
276
- "step": 7000
277
- },
278
- {
279
- "epoch": 2.8782894736842106,
280
- "eval_cer": 0.031555695803092455,
281
- "eval_loss": 0.14590401947498322,
282
- "eval_mer": 0.18665464382326422,
283
- "eval_runtime": 68.8491,
284
- "eval_samples_per_second": 17.662,
285
- "eval_steps_per_second": 2.208,
286
- "eval_wer": 0.18835304822565968,
287
- "eval_wil": 0.32247131315228605,
288
- "eval_wip": 0.677528686847714,
289
- "step": 7000
290
  }
291
  ],
292
  "logging_steps": 500,
293
- "max_steps": 7296,
294
  "num_input_tokens_seen": 0,
295
- "num_train_epochs": 3,
296
  "save_steps": 500,
297
  "stateful_callbacks": {
298
  "TrainerControl": {
@@ -306,7 +206,7 @@
306
  "attributes": {}
307
  }
308
  },
309
- "total_flos": 9.992785283464022e+18,
310
  "train_batch_size": 10,
311
  "trial_name": null,
312
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.410082072019577,
3
+ "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-4500",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 4864,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
  "epoch": 0.20559210526315788,
13
+ "grad_norm": 2.2851061820983887,
14
+ "learning_rate": 9.92e-05,
15
+ "loss": 6.3008,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.20559210526315788,
20
+ "eval_cer": 0.4373788489578866,
21
+ "eval_loss": 1.7558605670928955,
22
+ "eval_mer": 0.9513371639355891,
23
+ "eval_runtime": 65.8205,
24
+ "eval_samples_per_second": 18.474,
25
+ "eval_steps_per_second": 2.309,
26
+ "eval_wer": 0.9642651711245327,
27
+ "eval_wil": 0.9974733905930386,
28
+ "eval_wip": 0.0025266094069613973,
29
  "step": 500
30
  },
31
  {
32
  "epoch": 0.41118421052631576,
33
+ "grad_norm": 5.61221981048584,
34
+ "learning_rate": 8.863428047662696e-05,
35
+ "loss": 1.5187,
36
  "step": 1000
37
  },
38
  {
39
  "epoch": 0.41118421052631576,
40
+ "eval_cer": 0.2543099751265117,
41
+ "eval_loss": 0.9000231027603149,
42
+ "eval_mer": 0.6188369152970923,
43
+ "eval_runtime": 65.6413,
44
+ "eval_samples_per_second": 18.525,
45
+ "eval_steps_per_second": 2.316,
46
+ "eval_wer": 0.6335202761000863,
47
+ "eval_wil": 0.8495129479550749,
48
+ "eval_wip": 0.15048705204492513,
49
  "step": 1000
50
  },
51
  {
52
  "epoch": 0.6167763157894737,
53
+ "grad_norm": 4.668437480926514,
54
+ "learning_rate": 7.717690192483959e-05,
55
+ "loss": 1.1029,
56
  "step": 1500
57
  },
58
  {
59
  "epoch": 0.6167763157894737,
60
+ "eval_cer": 0.2021271121022386,
61
+ "eval_loss": 0.6554998159408569,
62
+ "eval_mer": 0.517606886248844,
63
+ "eval_runtime": 65.6608,
64
+ "eval_samples_per_second": 18.519,
65
+ "eval_steps_per_second": 2.315,
66
+ "eval_wer": 0.5231521426517113,
67
+ "eval_wil": 0.761288669534403,
68
+ "eval_wip": 0.23871133046559703,
69
  "step": 1500
70
  },
71
  {
72
  "epoch": 0.8223684210526315,
73
+ "grad_norm": 2.166978597640991,
74
+ "learning_rate": 6.571952337305225e-05,
75
+ "loss": 0.9255,
76
  "step": 2000
77
  },
78
  {
79
  "epoch": 0.8223684210526315,
80
+ "eval_cer": 0.17296509134574148,
81
+ "eval_loss": 0.5555564761161804,
82
+ "eval_mer": 0.45592748554707013,
83
+ "eval_runtime": 65.6661,
84
+ "eval_samples_per_second": 18.518,
85
+ "eval_steps_per_second": 2.315,
86
+ "eval_wer": 0.45930399769916597,
87
+ "eval_wil": 0.6969698207016493,
88
+ "eval_wip": 0.3030301792983507,
89
  "step": 2000
90
  },
91
  {
92
  "epoch": 1.0279605263157894,
93
+ "grad_norm": 2.7115116119384766,
94
+ "learning_rate": 5.4262144821264894e-05,
95
+ "loss": 0.8406,
96
  "step": 2500
97
  },
98
  {
99
  "epoch": 1.0279605263157894,
100
+ "eval_cer": 0.15896732138262287,
101
+ "eval_loss": 0.5135647058486938,
102
+ "eval_mer": 0.4211276641243139,
103
+ "eval_runtime": 65.5965,
104
+ "eval_samples_per_second": 18.538,
105
+ "eval_steps_per_second": 2.317,
106
+ "eval_wer": 0.4247914869140063,
107
+ "eval_wil": 0.6576477316919521,
108
+ "eval_wip": 0.3423522683080479,
109
  "step": 2500
110
  },
111
  {
112
  "epoch": 1.2335526315789473,
113
+ "grad_norm": 1.5140825510025024,
114
+ "learning_rate": 4.280476626947755e-05,
115
+ "loss": 0.7712,
116
  "step": 3000
117
  },
118
  {
119
  "epoch": 1.2335526315789473,
120
+ "eval_cer": 0.14858907281928124,
121
+ "eval_loss": 0.46155768632888794,
122
+ "eval_mer": 0.3986003998857469,
123
+ "eval_runtime": 65.9142,
124
+ "eval_samples_per_second": 18.448,
125
+ "eval_steps_per_second": 2.306,
126
+ "eval_wer": 0.4013517400057521,
127
+ "eval_wil": 0.6301973374782048,
128
+ "eval_wip": 0.3698026625217952,
129
  "step": 3000
130
  },
131
  {
132
  "epoch": 1.4391447368421053,
133
+ "grad_norm": 2.8752684593200684,
134
+ "learning_rate": 3.13473877176902e-05,
135
+ "loss": 0.7388,
136
  "step": 3500
137
  },
138
  {
139
  "epoch": 1.4391447368421053,
140
+ "eval_cer": 0.1433570632129685,
141
+ "eval_loss": 0.4430878758430481,
142
+ "eval_mer": 0.38519734494325886,
143
+ "eval_runtime": 65.6104,
144
+ "eval_samples_per_second": 18.534,
145
+ "eval_steps_per_second": 2.317,
146
+ "eval_wer": 0.38805004314063846,
147
+ "eval_wil": 0.6145415380151382,
148
+ "eval_wip": 0.3854584619848617,
149
  "step": 3500
150
  },
151
  {
152
  "epoch": 1.6447368421052633,
153
+ "grad_norm": 1.5182979106903076,
154
+ "learning_rate": 1.9890009165902843e-05,
155
+ "loss": 0.6985,
156
  "step": 4000
157
  },
158
  {
159
  "epoch": 1.6447368421052633,
160
+ "eval_cer": 0.13584355433570633,
161
+ "eval_loss": 0.4212208688259125,
162
+ "eval_mer": 0.3683083511777302,
163
+ "eval_runtime": 65.61,
164
+ "eval_samples_per_second": 18.534,
165
+ "eval_steps_per_second": 2.317,
166
+ "eval_wer": 0.3710094909404659,
167
+ "eval_wil": 0.5935129857245404,
168
+ "eval_wip": 0.40648701427545963,
169
  "step": 4000
170
  },
171
  {
172
  "epoch": 1.850328947368421,
173
+ "grad_norm": 5.133316516876221,
174
+ "learning_rate": 8.43263061411549e-06,
175
+ "loss": 0.6796,
176
  "step": 4500
177
  },
178
  {
179
  "epoch": 1.850328947368421,
180
+ "eval_cer": 0.13092031906681534,
181
+ "eval_loss": 0.410082072019577,
182
+ "eval_mer": 0.35861182519280205,
183
+ "eval_runtime": 65.7038,
184
+ "eval_samples_per_second": 18.507,
185
+ "eval_steps_per_second": 2.313,
186
+ "eval_wer": 0.3610871440897325,
187
+ "eval_wil": 0.5812666176163659,
188
+ "eval_wip": 0.4187333823836341,
189
  "step": 4500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
190
  }
191
  ],
192
  "logging_steps": 500,
193
+ "max_steps": 4864,
194
  "num_input_tokens_seen": 0,
195
+ "num_train_epochs": 2,
196
  "save_steps": 500,
197
  "stateful_callbacks": {
198
  "TrainerControl": {
 
206
  "attributes": {}
207
  }
208
  },
209
+ "total_flos": 6.647538946149148e+18,
210
  "train_batch_size": 10,
211
  "trial_name": null,
212
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f19595b62bd018202e86747cdb04e2517c6738c2c3b9ffc72eafdd7ffdf892c
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4198119a49d69bf1bd9588d18935fc8bc67c60ee84be7a6da6bc7b659766007c
3
  size 5176
vocab.json CHANGED
@@ -1,708 +1 @@
1
- {
2
- "<pad>": 0,
3
- "<s>": 1,
4
- "</s>": 2,
5
- "<unk>": 3,
6
- "|": 4,
7
- "a": 5,
8
- "á": 6,
9
- "à": 7,
10
- "ả": 8,
11
- "ã": 9,
12
- "ạ": 10,
13
- "e": 11,
14
- "é": 12,
15
- "è": 13,
16
- "ẻ": 14,
17
- "ẽ": 15,
18
- "ẹ": 16,
19
- "ê": 17,
20
- "ế": 18,
21
- "ề": 19,
22
- "ể": 20,
23
- "ễ": 21,
24
- "ệ": 22,
25
- "i": 23,
26
- "í": 24,
27
- "ì": 25,
28
- "ỉ": 26,
29
- "ĩ": 27,
30
- "ị": 28,
31
- "o": 29,
32
- "ó": 30,
33
- "ò": 31,
34
- "ỏ": 32,
35
- "õ": 33,
36
- "ọ": 34,
37
- "ơ": 35,
38
- "ớ": 36,
39
- "ờ": 37,
40
- "ở": 38,
41
- "ỡ": 39,
42
- "ợ": 40,
43
- "ô": 41,
44
- "ố": 42,
45
- "ồ": 43,
46
- "ổ": 44,
47
- "ỗ": 45,
48
- "ộ": 46,
49
- "u": 47,
50
- "ú": 48,
51
- "ù": 49,
52
- "ủ": 50,
53
- "ũ": 51,
54
- "ụ": 52,
55
- "ư": 53,
56
- "ứ": 54,
57
- "ừ": 55,
58
- "ử": 56,
59
- "ữ": 57,
60
- "ự": 58,
61
- "y": 59,
62
- "ỳ": 60,
63
- "ý": 61,
64
- "ỷ": 62,
65
- "ỹ": 63,
66
- "ỵ": 64,
67
- "ă": 65,
68
- "ắ": 66,
69
- "ằ": 67,
70
- "ẳ": 68,
71
- "ẵ": 69,
72
- "ặ": 70,
73
- "â": 71,
74
- "ấ": 72,
75
- "ầ": 73,
76
- "ẩ": 74,
77
- "ẫ": 75,
78
- "ậ": 76,
79
- "đ": 77,
80
- "q": 78,
81
- "w": 79,
82
- "r": 80,
83
- "t": 81,
84
- "p": 82,
85
- "s": 83,
86
- "d": 84,
87
- "f": 85,
88
- "g": 86,
89
- "h": 87,
90
- "j": 88,
91
- "k": 89,
92
- "l": 90,
93
- "z": 91,
94
- "x": 92,
95
- "c": 93,
96
- "v": 94,
97
- "b": 95,
98
- "n": 96,
99
- "m": 97,
100
- "th": 98,
101
- "ch": 99,
102
- "kh": 100,
103
- "ph": 101,
104
- "nh": 102,
105
- "gh": 103,
106
- "qu": 104,
107
- "ng": 105,
108
- "ngh": 106,
109
- "tr": 107,
110
- "ác": 108,
111
- "ạc": 109,
112
- "ai": 110,
113
- "ái": 111,
114
- "ài": 112,
115
- "ải": 113,
116
- "ãi": 114,
117
- "ại": 115,
118
- "am": 116,
119
- "ám": 117,
120
- "àm": 118,
121
- "ảm": 119,
122
- "ãm": 120,
123
- "ạm": 121,
124
- "an": 122,
125
- "án": 123,
126
- "àn": 124,
127
- "ản": 125,
128
- "ãn": 126,
129
- "ạn": 127,
130
- "ao": 128,
131
- "áo": 129,
132
- "ào": 130,
133
- "ảo": 131,
134
- "ão": 132,
135
- "ạo": 133,
136
- "au": 134,
137
- "áu": 135,
138
- "àu": 136,
139
- "ảu": 137,
140
- "ãu": 138,
141
- "ạu": 139,
142
- "áp": 140,
143
- "ạp": 141,
144
- "át": 142,
145
- "ạt": 143,
146
- "ay": 144,
147
- "áy": 145,
148
- "ày": 146,
149
- "ảy": 147,
150
- "ãy": 148,
151
- "ạy": 149,
152
- "ắc": 150,
153
- "ặc": 151,
154
- "ăm": 152,
155
- "ằm": 153,
156
- "ắm": 154,
157
- "ẳm": 155,
158
- "ẵm": 156,
159
- "ặm": 157,
160
- "ăn": 158,
161
- "ắn": 159,
162
- "ằn": 160,
163
- "ẳn": 161,
164
- "ẵn": 162,
165
- "ặn": 163,
166
- "ắp": 164,
167
- "ặp": 165,
168
- "ắt": 166,
169
- "ặt": 167,
170
- "ấc": 168,
171
- "ậc": 169,
172
- "âm": 170,
173
- "ấm": 171,
174
- "ầm": 172,
175
- "ẩm": 173,
176
- "ẫm": 174,
177
- "ậm": 175,
178
- "ân": 176,
179
- "ấn": 177,
180
- "ần": 178,
181
- "ẩn": 179,
182
- "ẫn": 180,
183
- "ận": 181,
184
- "ấp": 182,
185
- "ập": 183,
186
- "ất": 184,
187
- "ật": 185,
188
- "âu": 186,
189
- "ấu": 187,
190
- "ầu": 188,
191
- "ẩu": 189,
192
- "ẫu": 190,
193
- "ậu": 191,
194
- "ây": 192,
195
- "ấy": 193,
196
- "ầy": 194,
197
- "ẩy": 195,
198
- "ẫy": 196,
199
- "ậy": 197,
200
- "éc": 198,
201
- "ẹc": 199,
202
- "em": 200,
203
- "ém": 201,
204
- "èm": 202,
205
- "ẻm": 203,
206
- "ẽm": 204,
207
- "ẹm": 205,
208
- "en": 206,
209
- "én": 207,
210
- "èn": 208,
211
- "ẻn": 209,
212
- "ẽn": 210,
213
- "ẹn": 211,
214
- "eo": 212,
215
- "éo": 213,
216
- "èo": 214,
217
- "ẻo": 215,
218
- "ẽo": 216,
219
- "ẹo": 217,
220
- "ép": 218,
221
- "ẹp": 219,
222
- "ét": 220,
223
- "ẹt": 221,
224
- "êm": 222,
225
- "ếm": 223,
226
- "ềm": 224,
227
- "ễm": 225,
228
- "ệm": 226,
229
- "ên": 227,
230
- "ến": 228,
231
- "ền": 229,
232
- "ển": 230,
233
- "ện": 231,
234
- "ếp": 232,
235
- "ệp": 233,
236
- "ết": 234,
237
- "ệt": 235,
238
- "êu": 236,
239
- "ếu": 237,
240
- "ều": 238,
241
- "ểu": 239,
242
- "ễu": 240,
243
- "ệu": 241,
244
- "ia": 242,
245
- "ía": 243,
246
- "ìa": 244,
247
- "ỉa": 245,
248
- "ĩa": 246,
249
- "ịa": 247,
250
- "im": 248,
251
- "ím": 249,
252
- "ìm": 250,
253
- "ỉm": 251,
254
- "ĩm": 252,
255
- "ịm": 253,
256
- "in": 254,
257
- "ín": 255,
258
- "ìn": 256,
259
- "ỉn": 257,
260
- "ịn": 258,
261
- "íp": 259,
262
- "ịp": 260,
263
- "ít": 261,
264
- "ịt": 262,
265
- "iu": 263,
266
- "íu": 264,
267
- "ìu": 265,
268
- "ỉu": 266,
269
- "ĩu": 267,
270
- "ịu": 268,
271
- "oa": 269,
272
- "óa": 270,
273
- "òa": 271,
274
- "ỏa": 272,
275
- "õa": 273,
276
- "ọa": 274,
277
- "oà": 275,
278
- "óc": 276,
279
- "ọc": 277,
280
- "oe": 278,
281
- "óe": 279,
282
- "òe": 280,
283
- "ỏe": 281,
284
- "ọe": 282,
285
- "oẹ": 283,
286
- "oi": 284,
287
- "ói": 285,
288
- "òi": 286,
289
- "ỏi": 287,
290
- "õi": 288,
291
- "ọi": 289,
292
- "om": 290,
293
- "óm": 291,
294
- "òm": 292,
295
- "ỏm": 293,
296
- "õm": 294,
297
- "ọm": 295,
298
- "on": 296,
299
- "ón": 297,
300
- "òn": 298,
301
- "ỏn": 299,
302
- "õn": 300,
303
- "ọn": 301,
304
- "óp": 302,
305
- "ọp": 303,
306
- "ót": 304,
307
- "ọt": 305,
308
- "ốc": 306,
309
- "ộc": 307,
310
- "ôi": 308,
311
- "ối": 309,
312
- "ồi": 310,
313
- "ổi": 311,
314
- "ỗi": 312,
315
- "ội": 313,
316
- "ôm": 314,
317
- "ốm": 315,
318
- "ồm": 316,
319
- "ổm": 317,
320
- "ỗm": 318,
321
- "ộm": 319,
322
- "ôn": 320,
323
- "ốn": 321,
324
- "ồn": 322,
325
- "ổn": 323,
326
- "ỗn": 324,
327
- "ộn": 325,
328
- "ốp": 326,
329
- "ộp": 327,
330
- "ốt": 328,
331
- "ột": 329,
332
- "ơi": 330,
333
- "ới": 331,
334
- "ời": 332,
335
- "ởi": 333,
336
- "ỡi": 334,
337
- "ợi": 335,
338
- "ơm": 336,
339
- "ớm": 337,
340
- "ờm": 338,
341
- "ởm": 339,
342
- "ỡm": 340,
343
- "ợm": 341,
344
- "ơn": 342,
345
- "ớn": 343,
346
- "ờn": 344,
347
- "ởn": 345,
348
- "ỡn": 346,
349
- "ợn": 347,
350
- "ớp": 348,
351
- "ợp": 349,
352
- "ớt": 350,
353
- "ợt": 351,
354
- "ua": 352,
355
- "úa": 353,
356
- "ùa": 354,
357
- "ủa": 355,
358
- "ũa": 356,
359
- "ụa": 357,
360
- "úc": 358,
361
- "ục": 359,
362
- "uê": 360,
363
- "uế": 361,
364
- "uề": 362,
365
- "uể": 363,
366
- "uệ": 364,
367
- "ui": 365,
368
- "úi": 366,
369
- "ùi": 367,
370
- "ủi": 368,
371
- "ũi": 369,
372
- "ụi": 370,
373
- "um": 371,
374
- "úm": 372,
375
- "ùm": 373,
376
- "ủm": 374,
377
- "ũm": 375,
378
- "ụm": 376,
379
- "un": 377,
380
- "ún": 378,
381
- "ùn": 379,
382
- "ủn": 380,
383
- "ũn": 381,
384
- "ụn": 382,
385
- "úp": 383,
386
- "ụp": 384,
387
- "út": 385,
388
- "ụt": 386,
389
- "uy": 387,
390
- "úy": 388,
391
- "ùy": 389,
392
- "ủy": 390,
393
- "ũy": 391,
394
- "ụy": 392,
395
- "ưa": 393,
396
- "ứa": 394,
397
- "ừa": 395,
398
- "ửa": 396,
399
- "ữa": 397,
400
- "ựa": 398,
401
- "ức": 399,
402
- "ực": 400,
403
- "ửi": 401,
404
- "ừm": 402,
405
- "uơ": 403,
406
- "uở": 404,
407
- "ứt": 405,
408
- "ựt": 406,
409
- "ưu": 407,
410
- "ứu": 408,
411
- "ừu": 409,
412
- "ửu": 410,
413
- "ữu": 411,
414
- "ựu": 412,
415
- "sh": 413,
416
- "aw": 414,
417
- "ee": 415,
418
- "ea": 416,
419
- "ei": 417,
420
- "ew": 418,
421
- "eu": 419,
422
- "ie": 420,
423
- "oo": 421,
424
- "ou": 422,
425
- "ow": 423,
426
- "oy": 424,
427
- "ue": 425,
428
- "io": 426,
429
- "ách": 427,
430
- "ạch": 428,
431
- "ang": 429,
432
- "áng": 430,
433
- "àng": 431,
434
- "ảng": 432,
435
- "ãng": 433,
436
- "ạng": 434,
437
- "anh": 435,
438
- "ánh": 436,
439
- "ành": 437,
440
- "ảnh": 438,
441
- "ãnh": 439,
442
- "ạnh": 440,
443
- "ăng": 441,
444
- "ắng": 442,
445
- "ằng": 443,
446
- "ẳng": 444,
447
- "ẵng": 445,
448
- "ặng": 446,
449
- "âng": 447,
450
- "ấng": 448,
451
- "ầng": 449,
452
- "ẩng": 450,
453
- "ẫng": 451,
454
- "ậng": 452,
455
- "eng": 453,
456
- "éng": 454,
457
- "èng": 455,
458
- "ẻng": 456,
459
- "ếch": 457,
460
- "ệch": 458,
461
- "ênh": 459,
462
- "ếnh": 460,
463
- "ềnh": 461,
464
- "ểnh": 462,
465
- "ễnh": 463,
466
- "ệnh": 464,
467
- "ích": 465,
468
- "ịch": 466,
469
- "iếc": 467,
470
- "iệc": 468,
471
- "iêm": 469,
472
- "iếm": 470,
473
- "iềm": 471,
474
- "iểm": 472,
475
- "iễm": 473,
476
- "iệm": 474,
477
- "iên": 475,
478
- "iến": 476,
479
- "iền": 477,
480
- "iển": 478,
481
- "iễn": 479,
482
- "iện": 480,
483
- "iếp": 481,
484
- "iệp": 482,
485
- "iết": 483,
486
- "iệt": 484,
487
- "iêu": 485,
488
- "iếu": 486,
489
- "iều": 487,
490
- "iểu": 488,
491
- "iễu": 489,
492
- "iệu": 490,
493
- "inh": 491,
494
- "ính": 492,
495
- "ình": 493,
496
- "ỉnh": 494,
497
- "ĩnh": 495,
498
- "ịnh": 496,
499
- "oác": 497,
500
- "oạc": 498,
501
- "oai": 499,
502
- "oái": 500,
503
- "oài": 501,
504
- "oải": 502,
505
- "oãi": 503,
506
- "oại": 504,
507
- "oàm": 505,
508
- "oan": 506,
509
- "oán": 507,
510
- "oàn": 508,
511
- "oản": 509,
512
- "oãn": 510,
513
- "oạn": 511,
514
- "oao": 512,
515
- "oáo": 513,
516
- "oáp": 514,
517
- "oạp": 515,
518
- "oát": 516,
519
- "oạt": 517,
520
- "oay": 518,
521
- "oáy": 519,
522
- "oảy": 520,
523
- "oắc": 521,
524
- "oặc": 522,
525
- "oăm": 523,
526
- "oăn": 524,
527
- "oẳn": 525,
528
- "oắn": 526,
529
- "oằn": 527,
530
- "oắt": 528,
531
- "oặt": 529,
532
- "oen": 530,
533
- "oẻn": 531,
534
- "oeo": 532,
535
- "oéo": 533,
536
- "oèo": 534,
537
- "oẻo": 535,
538
- "oét": 536,
539
- "oẹt": 537,
540
- "ong": 538,
541
- "óng": 539,
542
- "òng": 540,
543
- "ỏng": 541,
544
- "õng": 542,
545
- "ọng": 543,
546
- "oóc": 544,
547
- "oọc": 545,
548
- "ông": 546,
549
- "ống": 547,
550
- "ồng": 548,
551
- "ổng": 549,
552
- "ỗng": 550,
553
- "ộng": 551,
554
- "uân": 552,
555
- "uấn": 553,
556
- "uần": 554,
557
- "uẩn": 555,
558
- "uẫn": 556,
559
- "uận": 557,
560
- "uất": 558,
561
- "uật": 559,
562
- "uây": 560,
563
- "uấy": 561,
564
- "uầy": 562,
565
- "ung": 563,
566
- "úng": 564,
567
- "ùng": 565,
568
- "ủng": 566,
569
- "ũng": 567,
570
- "ụng": 568,
571
- "uốc": 569,
572
- "uộc": 570,
573
- "uôi": 571,
574
- "uối": 572,
575
- "uồi": 573,
576
- "uổi": 574,
577
- "uỗi": 575,
578
- "uội": 576,
579
- "uôm": 577,
580
- "uốm": 578,
581
- "uồm": 579,
582
- "uỗm": 580,
583
- "uộm": 581,
584
- "uôn": 582,
585
- "uốn": 583,
586
- "uồn": 584,
587
- "uỗn": 585,
588
- "uộn": 586,
589
- "uốt": 587,
590
- "uột": 588,
591
- "uýt": 589,
592
- "uỵt": 590,
593
- "uya": 591,
594
- "uỷu": 592,
595
- "ưng": 593,
596
- "ứng": 594,
597
- "ừng": 595,
598
- "ửng": 596,
599
- "ững": 597,
600
- "ựng": 598,
601
- "ước": 599,
602
- "ược": 600,
603
- "ươi": 601,
604
- "ưới": 602,
605
- "ười": 603,
606
- "ưởi": 604,
607
- "ưỡi": 605,
608
- "ượi": 606,
609
- "ươm": 607,
610
- "ướm": 608,
611
- "ườm": 609,
612
- "ượm": 610,
613
- "ươn": 611,
614
- "ướn": 612,
615
- "ườn": 613,
616
- "ưỡn": 614,
617
- "ượn": 615,
618
- "ướp": 616,
619
- "ượp": 617,
620
- "ướt": 618,
621
- "ượt": 619,
622
- "ươu": 620,
623
- "ướu": 621,
624
- "ượu": 622,
625
- "yêm": 623,
626
- "yếm": 624,
627
- "yểm": 625,
628
- "yên": 626,
629
- "yến": 627,
630
- "yêu": 628,
631
- "yếu": 629,
632
- "yểu": 630,
633
- "yết": 631,
634
- "iêng": 632,
635
- "iếng": 633,
636
- "iềng": 634,
637
- "iểng": 635,
638
- "iễng": 636,
639
- "iệng": 637,
640
- "oách": 638,
641
- "oạch": 639,
642
- "oang": 640,
643
- "oáng": 641,
644
- "oàng": 642,
645
- "oảng": 643,
646
- "oãng": 644,
647
- "oạng": 645,
648
- "oanh": 646,
649
- "oánh": 647,
650
- "oành": 648,
651
- "oạnh": 649,
652
- "oảnh": 650,
653
- "oăng": 651,
654
- "oắng": 652,
655
- "oằng": 653,
656
- "oẳng": 654,
657
- "oong": 655,
658
- "uếch": 656,
659
- "uênh": 657,
660
- "uông": 658,
661
- "uống": 659,
662
- "uồng": 660,
663
- "uổng": 661,
664
- "uỗng": 662,
665
- "uộng": 663,
666
- "uých": 664,
667
- "uỵch": 665,
668
- "uyên": 666,
669
- "uyến": 667,
670
- "uyền": 668,
671
- "uyển": 669,
672
- "uyễn": 670,
673
- "uyện": 671,
674
- "uyết": 672,
675
- "uyệt": 673,
676
- "uynh": 674,
677
- "uỳnh": 675,
678
- "uýnh": 676,
679
- "uỷnh": 677,
680
- "ương": 678,
681
- "ướng": 679,
682
- "ường": 680,
683
- "ưởng": 681,
684
- "ưỡng": 682,
685
- "ượng": 683,
686
- "op": 684,
687
- "ot": 685,
688
- "gi": 686,
689
- "ap": 687,
690
- "at": 688,
691
- "ac": 689,
692
- "it": 690,
693
- "ip": 691,
694
- "ic": 692,
695
- "ep": 693,
696
- "et": 694,
697
- "ec": 695,
698
- "1": 696,
699
- "2": 697,
700
- "3": 698,
701
- "4": 699,
702
- "5": 700,
703
- "6": 701,
704
- "7": 702,
705
- "8": 703,
706
- "9": 704,
707
- "0": 705
708
- }
 
1
+ {"ẻ": 0, "6": 1, "ụ": 2, "í": 3, "3": 4, "ỹ": 5, "ý": 6, "ẩ": 7, "ở": 8, "ề": 9, "õ": 10, "7": 11, "ê": 12, "ứ": 13, "ỏ": 14, "v": 15, "ỷ": 16, "a": 17, "l": 18, "ự": 19, "q": 20, "ờ": 21, "j": 22, "ố": 23, "à": 24, "ỗ": 25, "n": 26, "é": 27, "ủ": 28, "у": 29, "ô": 30, "u": 31, "y": 32, "ằ": 33, "4": 34, "w": 35, "b": 36, "ệ": 37, "ễ": 38, "s": 39, "ì": 40, "ầ": 41, "ỵ": 42, "8": 43, "d": 44, "ể": 45, "r": 47, "ũ": 48, "c": 49, "ạ": 50, "9": 51, "ế": 52, "ù": 53, "ỡ": 54, "2": 55, "t": 56, "i": 57, "g": 58, "́": 59, "ử": 60, "̀": 61, "á": 62, "0": 63, "ậ": 64, "e": 65, "ộ": 66, "m": 67, "ẳ": 68, "ợ": 69, "ĩ": 70, "h": 71, "â": 72, "ú": 73, "ọ": 74, "ồ": 75, "ặ": 76, "f": 77, "ữ": 78, "ắ": 79, "ỳ": 80, "x": 81, "ó": 82, "ã": 83, "ổ": 84, "ị": 85, "̣": 86, "z": 87, "ả": 88, "đ": 89, "è": 90, "ừ": 91, "ò": 92, "ẵ": 93, "1": 94, "ơ": 95, "k": 96, "ẫ": 97, "p": 98, "ấ": 99, "ẽ": 100, "ỉ": 101, "ớ": 102, "ẹ": 103, "ă": 104, "o": 105, "ư": 106, "5": 107, "|": 46, "<unk>": 108, "<pad>": 109}