Yehor committed on
Commit
28ee5ca
·
verified ·
1 Parent(s): 2497622

Upload checkpoints epoch_0004_step_00080000

Browse files

Automatic checkpoint upload from train.py.

Report stem: epoch_0004_step_00080000
Epoch: 4
Global step: 80000

.hf_upload_sync/validation_epoch_0003.done ADDED
@@ -0,0 +1 @@
 
 
1
+ 1776438842.5521402
.hf_upload_sync/validation_epoch_0004_step_00080000.started ADDED
@@ -0,0 +1 @@
 
 
1
+ 1776440780.5114055
checkpoint_step_last.json CHANGED
@@ -116,126 +116,126 @@
116
  "feature_dim": 160,
117
  "padding_value": 1.0
118
  },
119
- "epoch": 3,
120
- "global_step": 70000,
121
  "best_val_wer": 0.2002018694869882,
122
  "metrics": {
123
- "epoch": 3,
124
- "global_step": 70000,
125
- "train_loss": 0.5679515531171964,
126
- "train_main_ctc_loss": 0.5679515531171964,
127
  "train_aed_loss": 0.0,
128
  "train_liberta_distill_loss": 0.0,
129
  "train_audio_teacher_loss": 0.0,
130
- "val_loss": 0.3990042791440246,
131
- "val_cer": 0.05228705349927267,
132
- "val_wer": 0.24808004564005792,
133
- "val_forward_seconds": 311.10390449501574,
134
  "val_teacher_seconds": 0.0,
135
- "val_decode_seconds": 0.9831855085212737,
136
- "val_gather_seconds": 0.0206975219771266,
137
  "val_model_source": "raw",
138
- "val_main_ctc_loss": 0.3990042791440246,
139
  "val_aed_loss": 0.0,
140
  "val_liberta_distill_loss": 0.0,
141
  "val_audio_teacher_loss": 0.0,
142
- "val_avg_blank_probability": 0.7959586015027048,
143
- "val_argmax_blank_fraction": 0.8018901517703331,
144
- "val_avg_top_nonblank_probability": 0.19443671218755104,
145
  "val_avg_output_frames": 129.72159800249688,
146
  "val_avg_target_tokens": 24.885455680399502,
147
  "val_target_tokens_per_frame": 0.1918374123013849,
148
  "val_impossible_sample_fraction": 0.0,
149
  "val_tight_sample_fraction": 0.0,
150
  "val_samples_short": 1183.0,
151
- "val_wer_short": 0.2962796952039444,
152
- "val_cer_short": 0.06460594952770336,
153
  "val_samples_medium": 2021.0,
154
- "val_wer_medium": 0.236343792633015,
155
- "val_cer_medium": 0.049377268640314366,
156
  "val_samples_long": 0.0,
157
  "val_decoded_empty_fraction": 0.0,
158
- "val_decoded_avg_char_length": 45.887016229712856,
159
- "val_decoded_avg_word_length": 7.069288389513108,
160
  "val_speaker_count": 0.0,
161
  "val_speaker_macro_wer": 0.0,
162
  "val_speaker_id_available": 0.0,
163
  "val_missing_speaker_id_samples": 3204.0,
164
- "val_hardest_example_0_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3201.wav",
165
  "val_hardest_example_0_speaker": "",
166
- "val_hardest_example_0_ref": "То й що?",
167
- "val_hardest_example_0_hyp": "— То що?",
168
- "val_hardest_example_1_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/2465.wav",
169
  "val_hardest_example_1_speaker": "",
170
- "val_hardest_example_1_ref": "Але ви?",
171
- "val_hardest_example_1_hyp": "Але ви.",
172
- "val_hardest_example_2_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3561.wav",
173
  "val_hardest_example_2_speaker": "",
174
- "val_hardest_example_2_ref": "Двадцять три?",
175
- "val_hardest_example_2_hyp": "Двадцять три.",
176
- "val_hardest_example_3_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3394.wav",
177
  "val_hardest_example_3_speaker": "",
178
- "val_hardest_example_3_ref": "Ще раз?",
179
- "val_hardest_example_3_hyp": "Ще раз.",
180
- "val_hardest_example_4_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/2306.wav",
181
  "val_hardest_example_4_speaker": "",
182
- "val_hardest_example_4_ref": "Попросіть.",
183
- "val_hardest_example_4_hyp": "Попрошіть.",
184
- "val_random_example_0_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/710.wav",
185
  "val_random_example_0_speaker": "",
186
- "val_random_example_0_ref": "Зраду брата і брехливі доноси на ближнього сини перейняли у Невського.",
187
- "val_random_example_0_hyp": "Зраду брата і брехливі доносина ближнього сини перейняли у Невсьського.",
188
- "val_random_example_1_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/2469.wav",
189
  "val_random_example_1_speaker": "",
190
- "val_random_example_1_ref": "Щоб довго не базікав тут.",
191
- "val_random_example_1_hyp": "Щоб довго не ба зікав тут.",
192
- "val_random_example_2_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3281.wav",
193
  "val_random_example_2_speaker": "",
194
- "val_random_example_2_ref": "Дехто їде возами за Гать.",
195
- "val_random_example_2_hyp": "Дехто їде возами загать?",
196
  "val_random_example_3_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3112.wav",
197
  "val_random_example_3_speaker": "",
198
  "val_random_example_3_ref": "Застосування мов в Україні гарантується Конституцією України та визначається законом.",
199
- "val_random_example_3_hyp": "Застосування мов враїні гарантується Конституцію Україниї та визначається законом",
200
- "val_random_example_4_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/2744.wav",
201
  "val_random_example_4_speaker": "",
202
- "val_random_example_4_ref": "Кожен має право на тупість, але дехто цим правом зловживає.",
203
- "val_random_example_4_hyp": "Кожен має право на тупість, але дехто цим правом зловживе.",
204
- "val/loss": 0.3990042791440246,
205
- "val/cer": 0.05228705349927267,
206
- "val/wer": 0.24808004564005792,
207
- "val/main_ctc_loss": 0.3990042791440246,
208
  "val/aed_loss": 0.0,
209
  "val/liberta_distill_loss": 0.0,
210
  "val/audio_teacher_loss": 0.0,
211
- "val/avg_blank_probability": 0.7959586015027048,
212
- "val/argmax_blank_fraction": 0.8018901517703331,
213
- "val/avg_top_nonblank_probability": 0.19443671218755104,
214
  "val/avg_output_frames": 129.72159800249688,
215
  "val/avg_target_tokens": 24.885455680399502,
216
  "val/target_tokens_per_frame": 0.1918374123013849,
217
  "val/impossible_sample_fraction": 0.0,
218
  "val/tight_sample_fraction": 0.0,
219
  "val/samples_short": 1183.0,
220
- "val/wer_short": 0.2962796952039444,
221
- "val/cer_short": 0.06460594952770336,
222
  "val/samples_medium": 2021.0,
223
- "val/wer_medium": 0.236343792633015,
224
- "val/cer_medium": 0.049377268640314366,
225
  "val/samples_long": 0.0,
226
  "val/decoded_empty_fraction": 0.0,
227
- "val/decoded_avg_char_length": 45.887016229712856,
228
- "val/decoded_avg_word_length": 7.069288389513108,
229
  "val/speaker_count": 0.0,
230
  "val/speaker_macro_wer": 0.0,
231
  "val/speaker_id_available": 0.0,
232
  "val/missing_speaker_id_samples": 3204.0,
233
- "val/forward_seconds": 311.10390449501574,
234
  "val/teacher_seconds": 0.0,
235
- "val/decode_seconds": 0.9831855085212737,
236
- "val/gather_seconds": 0.0206975219771266,
237
- "train/loss": 0.5679515531171964,
238
- "train/main_ctc_loss": 0.5679515531171964,
239
  "train/aed_loss": 0.0,
240
  "train/liberta_distill_loss": 0.0,
241
  "train/audio_teacher_loss": 0.0
 
116
  "feature_dim": 160,
117
  "padding_value": 1.0
118
  },
119
+ "epoch": 4,
120
+ "global_step": 80000,
121
  "best_val_wer": 0.2002018694869882,
122
  "metrics": {
123
+ "epoch": 4,
124
+ "global_step": 80000,
125
+ "train_loss": 0.5720258672326572,
126
+ "train_main_ctc_loss": 0.5720258672326572,
127
  "train_aed_loss": 0.0,
128
  "train_liberta_distill_loss": 0.0,
129
  "train_audio_teacher_loss": 0.0,
130
+ "val_loss": 0.36097462281870185,
131
+ "val_cer": 0.045040676687678464,
132
+ "val_wer": 0.2181506999605038,
133
+ "val_forward_seconds": 301.635894693085,
134
  "val_teacher_seconds": 0.0,
135
+ "val_decode_seconds": 0.9517203441355377,
136
+ "val_gather_seconds": 5.703901747940108,
137
  "val_model_source": "raw",
138
+ "val_main_ctc_loss": 0.36097462281870185,
139
  "val_aed_loss": 0.0,
140
  "val_liberta_distill_loss": 0.0,
141
  "val_audio_teacher_loss": 0.0,
142
+ "val_avg_blank_probability": 0.794819268942859,
143
+ "val_argmax_blank_fraction": 0.800636626983745,
144
+ "val_avg_top_nonblank_probability": 0.19556051142716604,
145
  "val_avg_output_frames": 129.72159800249688,
146
  "val_avg_target_tokens": 24.885455680399502,
147
  "val_target_tokens_per_frame": 0.1918374123013849,
148
  "val_impossible_sample_fraction": 0.0,
149
  "val_tight_sample_fraction": 0.0,
150
  "val_samples_short": 1183.0,
151
+ "val_wer_short": 0.26064545047064097,
152
+ "val_cer_short": 0.0564993655716904,
153
  "val_samples_medium": 2021.0,
154
+ "val_wer_medium": 0.20780354706684856,
155
+ "val_cer_medium": 0.042334077058843116,
156
  "val_samples_long": 0.0,
157
  "val_decoded_empty_fraction": 0.0,
158
+ "val_decoded_avg_char_length": 46.24032459425718,
159
+ "val_decoded_avg_word_length": 7.117353308364544,
160
  "val_speaker_count": 0.0,
161
  "val_speaker_macro_wer": 0.0,
162
  "val_speaker_id_available": 0.0,
163
  "val_missing_speaker_id_samples": 3204.0,
164
+ "val_hardest_example_0_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1317.wav",
165
  "val_hardest_example_0_speaker": "",
166
+ "val_hardest_example_0_ref": "Чому я так кажу?",
167
+ "val_hardest_example_0_hyp": "Чому я это кажу?",
168
+ "val_hardest_example_1_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1920.wav",
169
  "val_hardest_example_1_speaker": "",
170
+ "val_hardest_example_1_ref": "Дякую.",
171
+ "val_hardest_example_1_hyp": "Дякую!",
172
+ "val_hardest_example_2_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/721.wav",
173
  "val_hardest_example_2_speaker": "",
174
+ "val_hardest_example_2_ref": "Нульових.",
175
+ "val_hardest_example_2_hyp": "нуульових",
176
+ "val_hardest_example_3_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3426.wav",
177
  "val_hardest_example_3_speaker": "",
178
+ "val_hardest_example_3_ref": "Украли щось?",
179
+ "val_hardest_example_3_hyp": "Украли щось.",
180
+ "val_hardest_example_4_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/662.wav",
181
  "val_hardest_example_4_speaker": "",
182
+ "val_hardest_example_4_ref": "Тире?",
183
+ "val_hardest_example_4_hyp": "Тира.",
184
+ "val_random_example_0_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3097.wav",
185
  "val_random_example_0_speaker": "",
186
+ "val_random_example_0_ref": "Ніхто про це нині не хоче думати.",
187
+ "val_random_example_0_hyp": "Ніхто про це нині не хоче думати.",
188
+ "val_random_example_1_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/953.wav",
189
  "val_random_example_1_speaker": "",
190
+ "val_random_example_1_ref": "А що сталося, Андрію?",
191
+ "val_random_example_1_hyp": "А що сталося, Андрію?",
192
+ "val_random_example_2_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1073.wav",
193
  "val_random_example_2_speaker": "",
194
+ "val_random_example_2_ref": "Так, як і була.",
195
+ "val_random_example_2_hyp": "Так, як і була.",
196
  "val_random_example_3_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3112.wav",
197
  "val_random_example_3_speaker": "",
198
  "val_random_example_3_ref": "Застосування мов в Україні гарантується Конституцією України та визначається законом.",
199
+ "val_random_example_3_hyp": "Застосування мов в Україні гарантується Конституцією України та визначається законо",
200
+ "val_random_example_4_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/182.wav",
201
  "val_random_example_4_speaker": "",
202
+ "val_random_example_4_ref": "Один одного хваліте, тоді й Бог вас похвалить.",
203
+ "val_random_example_4_hyp": "Один одного хваліти, тоді Бог вас похвалить.",
204
+ "val/loss": 0.36097462281870185,
205
+ "val/cer": 0.045040676687678464,
206
+ "val/wer": 0.2181506999605038,
207
+ "val/main_ctc_loss": 0.36097462281870185,
208
  "val/aed_loss": 0.0,
209
  "val/liberta_distill_loss": 0.0,
210
  "val/audio_teacher_loss": 0.0,
211
+ "val/avg_blank_probability": 0.794819268942859,
212
+ "val/argmax_blank_fraction": 0.800636626983745,
213
+ "val/avg_top_nonblank_probability": 0.19556051142716604,
214
  "val/avg_output_frames": 129.72159800249688,
215
  "val/avg_target_tokens": 24.885455680399502,
216
  "val/target_tokens_per_frame": 0.1918374123013849,
217
  "val/impossible_sample_fraction": 0.0,
218
  "val/tight_sample_fraction": 0.0,
219
  "val/samples_short": 1183.0,
220
+ "val/wer_short": 0.26064545047064097,
221
+ "val/cer_short": 0.0564993655716904,
222
  "val/samples_medium": 2021.0,
223
+ "val/wer_medium": 0.20780354706684856,
224
+ "val/cer_medium": 0.042334077058843116,
225
  "val/samples_long": 0.0,
226
  "val/decoded_empty_fraction": 0.0,
227
+ "val/decoded_avg_char_length": 46.24032459425718,
228
+ "val/decoded_avg_word_length": 7.117353308364544,
229
  "val/speaker_count": 0.0,
230
  "val/speaker_macro_wer": 0.0,
231
  "val/speaker_id_available": 0.0,
232
  "val/missing_speaker_id_samples": 3204.0,
233
+ "val/forward_seconds": 301.635894693085,
234
  "val/teacher_seconds": 0.0,
235
+ "val/decode_seconds": 0.9517203441355377,
236
+ "val/gather_seconds": 5.703901747940108,
237
+ "train/loss": 0.5720258672326572,
238
+ "train/main_ctc_loss": 0.5720258672326572,
239
  "train/aed_loss": 0.0,
240
  "train/liberta_distill_loss": 0.0,
241
  "train/audio_teacher_loss": 0.0
checkpoint_step_last.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2077a53612ec551c754db2426a335571fbb7d93e511454ca0832beff8fddcd35
3
  size 2424913224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b044c369a25bcfb22956e76b8b7e334cdaab4f376a8db9570f5209b9937c9303
3
  size 2424913224
checkpoint_topk_avg.json CHANGED
@@ -431,6 +431,12 @@
431
  "val_wer": 0.20322991179181113,
432
  "path": "checkpoint_epoch=0003_step=00050000_valwer=0.203230.pt"
433
  },
 
 
 
 
 
 
434
  {
435
  "epoch": 3,
436
  "global_step": 20000,
@@ -442,12 +448,6 @@
442
  "global_step": 30000,
443
  "val_wer": 0.22912186773160134,
444
  "path": "checkpoint_epoch=0003_step=00030000_valwer=0.229122.pt"
445
- },
446
- {
447
- "epoch": 3,
448
- "global_step": 70000,
449
- "val_wer": 0.24808004564005792,
450
- "path": "checkpoint_epoch=0003_step=00070000_valwer=0.248080.pt"
451
  }
452
  ]
453
  }
 
431
  "val_wer": 0.20322991179181113,
432
  "path": "checkpoint_epoch=0003_step=00050000_valwer=0.203230.pt"
433
  },
434
+ {
435
+ "epoch": 4,
436
+ "global_step": 80000,
437
+ "val_wer": 0.2181506999605038,
438
+ "path": "checkpoint_epoch=0004_step=00080000_valwer=0.218151.pt"
439
+ },
440
  {
441
  "epoch": 3,
442
  "global_step": 20000,
 
448
  "global_step": 30000,
449
  "val_wer": 0.22912186773160134,
450
  "path": "checkpoint_epoch=0003_step=00030000_valwer=0.229122.pt"
 
 
 
 
 
 
451
  }
452
  ]
453
  }
checkpoint_topk_avg.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f9e194cf05eb11d05f787490c93137a82202f63a45da86d1bd6ddd0fd2f90b1
3
  size 2424913224
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4eaf31f0a125e71d4cc060537a534c339d3aceab71ade0da0f55c591771049f
3
  size 2424913224
checkpoints_topk/metadata.json CHANGED
@@ -13,6 +13,12 @@
13
  "val_wer": 0.20322991179181113,
14
  "path": "checkpoint_epoch=0003_step=00050000_valwer=0.203230.pt"
15
  },
 
 
 
 
 
 
16
  {
17
  "epoch": 3,
18
  "global_step": 20000,
@@ -24,12 +30,6 @@
24
  "global_step": 30000,
25
  "val_wer": 0.22912186773160134,
26
  "path": "checkpoint_epoch=0003_step=00030000_valwer=0.229122.pt"
27
- },
28
- {
29
- "epoch": 3,
30
- "global_step": 70000,
31
- "val_wer": 0.24808004564005792,
32
- "path": "checkpoint_epoch=0003_step=00070000_valwer=0.248080.pt"
33
  }
34
  ]
35
  }
 
13
  "val_wer": 0.20322991179181113,
14
  "path": "checkpoint_epoch=0003_step=00050000_valwer=0.203230.pt"
15
  },
16
+ {
17
+ "epoch": 4,
18
+ "global_step": 80000,
19
+ "val_wer": 0.2181506999605038,
20
+ "path": "checkpoint_epoch=0004_step=00080000_valwer=0.218151.pt"
21
+ },
22
  {
23
  "epoch": 3,
24
  "global_step": 20000,
 
30
  "global_step": 30000,
31
  "val_wer": 0.22912186773160134,
32
  "path": "checkpoint_epoch=0003_step=00030000_valwer=0.229122.pt"
 
 
 
 
 
 
33
  }
34
  ]
35
  }
eval_reports/epoch_0004_step_00080000.json ADDED
@@ -0,0 +1,133 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 4,
3
+ "global_step": 80000,
4
+ "model_source": "raw",
5
+ "metrics": {
6
+ "loss": 0.36097462281870185,
7
+ "main_ctc_loss": 0.36097462281870185,
8
+ "aed_loss": 0.0,
9
+ "liberta_distill_loss": 0.0,
10
+ "audio_teacher_loss": 0.0,
11
+ "cer": 0.045040676687678464,
12
+ "wer": 0.2181506999605038,
13
+ "avg_blank_probability": 0.794819268942859,
14
+ "argmax_blank_fraction": 0.800636626983745,
15
+ "avg_top_nonblank_probability": 0.19556051142716604,
16
+ "avg_output_frames": 129.72159800249688,
17
+ "avg_target_tokens": 24.885455680399502,
18
+ "target_tokens_per_frame": 0.1918374123013849,
19
+ "impossible_sample_fraction": 0.0,
20
+ "tight_sample_fraction": 0.0,
21
+ "samples_short": 1183.0,
22
+ "wer_short": 0.26064545047064097,
23
+ "cer_short": 0.0564993655716904,
24
+ "samples_medium": 2021.0,
25
+ "wer_medium": 0.20780354706684856,
26
+ "cer_medium": 0.042334077058843116,
27
+ "samples_long": 0.0,
28
+ "decoded_empty_fraction": 0.0,
29
+ "decoded_avg_char_length": 46.24032459425718,
30
+ "decoded_avg_word_length": 7.117353308364544,
31
+ "speaker_count": 0.0,
32
+ "speaker_macro_wer": 0.0,
33
+ "speaker_id_available": 0.0,
34
+ "missing_speaker_id_samples": 3204.0
35
+ },
36
+ "hardest_examples": [
37
+ {
38
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1317.wav",
39
+ "speaker_id": "",
40
+ "reference": "Чому я так кажу?",
41
+ "hypothesis": "Чому я это кажу?"
42
+ },
43
+ {
44
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1920.wav",
45
+ "speaker_id": "",
46
+ "reference": "Дякую.",
47
+ "hypothesis": "Дякую!"
48
+ },
49
+ {
50
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/721.wav",
51
+ "speaker_id": "",
52
+ "reference": "Нульових.",
53
+ "hypothesis": "нуульових"
54
+ },
55
+ {
56
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3426.wav",
57
+ "speaker_id": "",
58
+ "reference": "Украли щось?",
59
+ "hypothesis": "Украли щось."
60
+ },
61
+ {
62
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/662.wav",
63
+ "speaker_id": "",
64
+ "reference": "Тире?",
65
+ "hypothesis": "Тира."
66
+ }
67
+ ],
68
+ "random_examples": [
69
+ {
70
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3097.wav",
71
+ "speaker_id": "",
72
+ "reference": "Ніхто про це нині не хоче думати.",
73
+ "hypothesis": "Ніхто про це нині не хоче думати."
74
+ },
75
+ {
76
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/953.wav",
77
+ "speaker_id": "",
78
+ "reference": "А що сталося, Андрію?",
79
+ "hypothesis": "А що сталося, Андрію?"
80
+ },
81
+ {
82
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/1073.wav",
83
+ "speaker_id": "",
84
+ "reference": "Так, як і була.",
85
+ "hypothesis": "Так, як і була."
86
+ },
87
+ {
88
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/3112.wav",
89
+ "speaker_id": "",
90
+ "reference": "Застосування мов в Україні гарантується Конституцією України та визначається законом.",
91
+ "hypothesis": "Застосування мов в Україні гарантується Конституцією України та визначається законо"
92
+ },
93
+ {
94
+ "utterance_id": "/home/yehor/squeezeformer/data/cv10-uk-testset-clean-punctuated/182.wav",
95
+ "speaker_id": "",
96
+ "reference": "Один одного хваліте, тоді й Бог вас похвалить.",
97
+ "hypothesis": "Один одного хваліти, тоді Бог вас похвалить."
98
+ }
99
+ ],
100
+ "speaker_metrics": {
101
+ "speaker_count": 0,
102
+ "speaker_macro_wer": 0.0,
103
+ "speaker_id_available": false,
104
+ "missing_speaker_id_samples": 3204,
105
+ "per_speaker": {}
106
+ },
107
+ "split_audit": {
108
+ "counts": {
109
+ "train": {
110
+ "samples": 648240,
111
+ "speakers": 0,
112
+ "records_with_speaker_id": 0,
113
+ "hours": 1264.353836267957
114
+ },
115
+ "validation": {
116
+ "samples": 3204,
117
+ "speakers": 0,
118
+ "records_with_speaker_id": 0,
119
+ "hours": 4.629311440972232
120
+ }
121
+ },
122
+ "hours": {
123
+ "train": 1264.353836267957,
124
+ "validation": 4.629311440972232
125
+ },
126
+ "total_hours": 1268.9831477089292,
127
+ "speaker_overlaps": {
128
+ "train_vs_validation": 0
129
+ },
130
+ "speaker_balance_ratio": 1.0,
131
+ "speaker_id_available": false
132
+ }
133
+ }
training_20260415_090229.log CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dbe3e09d7d120ef4658b1312f7c994a7b19b4e07eb63b4675592fb9a04eac87
3
- size 11070395
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:440777b8f5e9a4a846cbc5230579b8b6819704b6e9a1a92020075828a00287d3
3
+ size 11168674