utakumi committed on
Commit
98690de
·
verified ·
1 Parent(s): 97999fa

End of training

Browse files
Files changed (5) hide show
  1. README.md +8 -4
  2. all_results.json +16 -0
  3. eval_results.json +10 -0
  4. train_results.json +9 -0
  5. trainer_state.json +357 -0
README.md CHANGED
@@ -1,8 +1,12 @@
1
  ---
2
  library_name: transformers
 
 
3
  license: apache-2.0
4
  base_model: rinna/japanese-hubert-base
5
  tags:
 
 
6
  - generated_from_trainer
7
  metrics:
8
  - wer
@@ -16,11 +20,11 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # Hubert-common_voice-phoneme-onlyJSUT
18
 
19
- This model is a fine-tuned version of [rinna/japanese-hubert-base](https://huggingface.co/rinna/japanese-hubert-base) on the None dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.1617
22
- - Wer: 0.998
23
- - Cer: 0.1060
24
 
25
  ## Model description
26
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - ja
5
  license: apache-2.0
6
  base_model: rinna/japanese-hubert-base
7
  tags:
8
+ - automatic-speech-recognition
9
+ - mozilla-foundation/common_voice_13_0
10
  - generated_from_trainer
11
  metrics:
12
  - wer
 
20
 
21
  # Hubert-common_voice-phoneme-onlyJSUT
22
 
23
+ This model is a fine-tuned version of [rinna/japanese-hubert-base](https://huggingface.co/rinna/japanese-hubert-base) on the MOZILLA-FOUNDATION/COMMON_VOICE_13_0 - JA dataset.
24
  It achieves the following results on the evaluation set:
25
+ - Loss: 0.1563
26
+ - Wer: 1.0
27
+ - Cer: 0.1052
28
 
29
  ## Model description
30
 
all_results.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_cer": 0.10522982265653276,
4
+ "eval_loss": 0.15634456276893616,
5
+ "eval_runtime": 20.6964,
6
+ "eval_samples": 500,
7
+ "eval_samples_per_second": 24.159,
8
+ "eval_steps_per_second": 3.044,
9
+ "eval_wer": 1.0,
10
+ "total_flos": 4.085369652431226e+18,
11
+ "train_loss": 2.2413718947282075,
12
+ "train_runtime": 5214.7646,
13
+ "train_samples": 4500,
14
+ "train_samples_per_second": 17.259,
15
+ "train_steps_per_second": 0.541
16
+ }
eval_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "eval_cer": 0.10522982265653276,
4
+ "eval_loss": 0.15634456276893616,
5
+ "eval_runtime": 20.6964,
6
+ "eval_samples": 500,
7
+ "eval_samples_per_second": 24.159,
8
+ "eval_steps_per_second": 3.044,
9
+ "eval_wer": 1.0
10
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 20.0,
3
+ "total_flos": 4.085369652431226e+18,
4
+ "train_loss": 2.2413718947282075,
5
+ "train_runtime": 5214.7646,
6
+ "train_samples": 4500,
7
+ "train_samples_per_second": 17.259,
8
+ "train_steps_per_second": 0.541
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,357 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.16017669439315796,
3
+ "best_model_checkpoint": "./Hubert-common_voice-phoneme-onlyJSUT/checkpoint-2600",
4
+ "epoch": 20.0,
5
+ "eval_steps": 100,
6
+ "global_step": 2820,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.7092198581560284,
13
+ "eval_cer": 0.9860960308843045,
14
+ "eval_loss": 11.361393928527832,
15
+ "eval_runtime": 21.3659,
16
+ "eval_samples_per_second": 23.402,
17
+ "eval_steps_per_second": 2.949,
18
+ "eval_wer": 1.054,
19
+ "step": 100
20
+ },
21
+ {
22
+ "epoch": 1.4184397163120568,
23
+ "eval_cer": 0.9851007359150682,
24
+ "eval_loss": 5.935764789581299,
25
+ "eval_runtime": 21.3202,
26
+ "eval_samples_per_second": 23.452,
27
+ "eval_steps_per_second": 2.955,
28
+ "eval_wer": 1.0,
29
+ "step": 200
30
+ },
31
+ {
32
+ "epoch": 2.127659574468085,
33
+ "eval_cer": 0.9850705754614549,
34
+ "eval_loss": 5.310074329376221,
35
+ "eval_runtime": 20.7223,
36
+ "eval_samples_per_second": 24.129,
37
+ "eval_steps_per_second": 3.04,
38
+ "eval_wer": 1.0,
39
+ "step": 300
40
+ },
41
+ {
42
+ "epoch": 2.8368794326241136,
43
+ "eval_cer": 0.9851007359150682,
44
+ "eval_loss": 4.895324230194092,
45
+ "eval_runtime": 20.9802,
46
+ "eval_samples_per_second": 23.832,
47
+ "eval_steps_per_second": 3.003,
48
+ "eval_wer": 1.0,
49
+ "step": 400
50
+ },
51
+ {
52
+ "epoch": 3.546099290780142,
53
+ "grad_norm": 18.17830467224121,
54
+ "learning_rate": 1.1903999999999998e-05,
55
+ "loss": 6.9061,
56
+ "step": 500
57
+ },
58
+ {
59
+ "epoch": 3.546099290780142,
60
+ "eval_cer": 0.9851007359150682,
61
+ "eval_loss": 4.402055740356445,
62
+ "eval_runtime": 21.0039,
63
+ "eval_samples_per_second": 23.805,
64
+ "eval_steps_per_second": 2.999,
65
+ "eval_wer": 1.0,
66
+ "step": 500
67
+ },
68
+ {
69
+ "epoch": 4.25531914893617,
70
+ "eval_cer": 0.9851007359150682,
71
+ "eval_loss": 3.9323222637176514,
72
+ "eval_runtime": 21.0838,
73
+ "eval_samples_per_second": 23.715,
74
+ "eval_steps_per_second": 2.988,
75
+ "eval_wer": 1.0,
76
+ "step": 600
77
+ },
78
+ {
79
+ "epoch": 4.964539007092198,
80
+ "eval_cer": 0.9851007359150682,
81
+ "eval_loss": 3.4932363033294678,
82
+ "eval_runtime": 20.4799,
83
+ "eval_samples_per_second": 24.414,
84
+ "eval_steps_per_second": 3.076,
85
+ "eval_wer": 1.0,
86
+ "step": 700
87
+ },
88
+ {
89
+ "epoch": 5.673758865248227,
90
+ "eval_cer": 0.9850404150078417,
91
+ "eval_loss": 3.209160566329956,
92
+ "eval_runtime": 21.0193,
93
+ "eval_samples_per_second": 23.788,
94
+ "eval_steps_per_second": 2.997,
95
+ "eval_wer": 1.0,
96
+ "step": 800
97
+ },
98
+ {
99
+ "epoch": 6.382978723404255,
100
+ "eval_cer": 0.9850705754614549,
101
+ "eval_loss": 3.0484230518341064,
102
+ "eval_runtime": 20.7411,
103
+ "eval_samples_per_second": 24.107,
104
+ "eval_steps_per_second": 3.037,
105
+ "eval_wer": 1.0,
106
+ "step": 900
107
+ },
108
+ {
109
+ "epoch": 7.092198581560283,
110
+ "grad_norm": 0.6846523284912109,
111
+ "learning_rate": 2.3903999999999997e-05,
112
+ "loss": 3.4303,
113
+ "step": 1000
114
+ },
115
+ {
116
+ "epoch": 7.092198581560283,
117
+ "eval_cer": 0.9850404150078417,
118
+ "eval_loss": 2.9960806369781494,
119
+ "eval_runtime": 20.4215,
120
+ "eval_samples_per_second": 24.484,
121
+ "eval_steps_per_second": 3.085,
122
+ "eval_wer": 1.0,
123
+ "step": 1000
124
+ },
125
+ {
126
+ "epoch": 7.801418439716312,
127
+ "eval_cer": 0.9850102545542285,
128
+ "eval_loss": 2.799971580505371,
129
+ "eval_runtime": 20.9162,
130
+ "eval_samples_per_second": 23.905,
131
+ "eval_steps_per_second": 3.012,
132
+ "eval_wer": 1.0,
133
+ "step": 1100
134
+ },
135
+ {
136
+ "epoch": 8.51063829787234,
137
+ "eval_cer": 0.5949149475208108,
138
+ "eval_loss": 1.9060593843460083,
139
+ "eval_runtime": 21.115,
140
+ "eval_samples_per_second": 23.68,
141
+ "eval_steps_per_second": 2.984,
142
+ "eval_wer": 1.0,
143
+ "step": 1200
144
+ },
145
+ {
146
+ "epoch": 9.21985815602837,
147
+ "eval_cer": 0.1546929665822174,
148
+ "eval_loss": 0.8767441511154175,
149
+ "eval_runtime": 20.8067,
150
+ "eval_samples_per_second": 24.031,
151
+ "eval_steps_per_second": 3.028,
152
+ "eval_wer": 1.0,
153
+ "step": 1300
154
+ },
155
+ {
156
+ "epoch": 9.929078014184396,
157
+ "eval_cer": 0.12679454698998674,
158
+ "eval_loss": 0.5386155843734741,
159
+ "eval_runtime": 21.0364,
160
+ "eval_samples_per_second": 23.768,
161
+ "eval_steps_per_second": 2.995,
162
+ "eval_wer": 1.0,
163
+ "step": 1400
164
+ },
165
+ {
166
+ "epoch": 10.638297872340425,
167
+ "grad_norm": 2.450634241104126,
168
+ "learning_rate": 3.5903999999999994e-05,
169
+ "loss": 1.6163,
170
+ "step": 1500
171
+ },
172
+ {
173
+ "epoch": 10.638297872340425,
174
+ "eval_cer": 0.11901314995777537,
175
+ "eval_loss": 0.38196861743927,
176
+ "eval_runtime": 21.1077,
177
+ "eval_samples_per_second": 23.688,
178
+ "eval_steps_per_second": 2.985,
179
+ "eval_wer": 1.0,
180
+ "step": 1500
181
+ },
182
+ {
183
+ "epoch": 11.347517730496454,
184
+ "eval_cer": 0.11382555193630112,
185
+ "eval_loss": 0.298287034034729,
186
+ "eval_runtime": 21.1084,
187
+ "eval_samples_per_second": 23.687,
188
+ "eval_steps_per_second": 2.985,
189
+ "eval_wer": 1.0,
190
+ "step": 1600
191
+ },
192
+ {
193
+ "epoch": 12.056737588652481,
194
+ "eval_cer": 0.11165399927614911,
195
+ "eval_loss": 0.25243452191352844,
196
+ "eval_runtime": 20.9043,
197
+ "eval_samples_per_second": 23.919,
198
+ "eval_steps_per_second": 3.014,
199
+ "eval_wer": 1.0,
200
+ "step": 1700
201
+ },
202
+ {
203
+ "epoch": 12.76595744680851,
204
+ "eval_cer": 0.110417420678007,
205
+ "eval_loss": 0.22604165971279144,
206
+ "eval_runtime": 20.6318,
207
+ "eval_samples_per_second": 24.234,
208
+ "eval_steps_per_second": 3.054,
209
+ "eval_wer": 1.0,
210
+ "step": 1800
211
+ },
212
+ {
213
+ "epoch": 13.47517730496454,
214
+ "eval_cer": 0.11099046929665822,
215
+ "eval_loss": 0.20960931479930878,
216
+ "eval_runtime": 20.9655,
217
+ "eval_samples_per_second": 23.849,
218
+ "eval_steps_per_second": 3.005,
219
+ "eval_wer": 1.0,
220
+ "step": 1900
221
+ },
222
+ {
223
+ "epoch": 14.184397163120567,
224
+ "grad_norm": 1.458462119102478,
225
+ "learning_rate": 4.7903999999999994e-05,
226
+ "loss": 0.332,
227
+ "step": 2000
228
+ },
229
+ {
230
+ "epoch": 14.184397163120567,
231
+ "eval_cer": 0.10924116298709133,
232
+ "eval_loss": 0.18963314592838287,
233
+ "eval_runtime": 20.9261,
234
+ "eval_samples_per_second": 23.894,
235
+ "eval_steps_per_second": 3.011,
236
+ "eval_wer": 0.998,
237
+ "step": 2000
238
+ },
239
+ {
240
+ "epoch": 14.893617021276595,
241
+ "eval_cer": 0.10945228616238388,
242
+ "eval_loss": 0.1838211864233017,
243
+ "eval_runtime": 20.7677,
244
+ "eval_samples_per_second": 24.076,
245
+ "eval_steps_per_second": 3.034,
246
+ "eval_wer": 1.0,
247
+ "step": 2100
248
+ },
249
+ {
250
+ "epoch": 15.602836879432624,
251
+ "eval_cer": 0.10806490529617566,
252
+ "eval_loss": 0.17658106982707977,
253
+ "eval_runtime": 21.0918,
254
+ "eval_samples_per_second": 23.706,
255
+ "eval_steps_per_second": 2.987,
256
+ "eval_wer": 1.0,
257
+ "step": 2200
258
+ },
259
+ {
260
+ "epoch": 16.31205673758865,
261
+ "eval_cer": 0.10706961032693932,
262
+ "eval_loss": 0.1687668263912201,
263
+ "eval_runtime": 20.9189,
264
+ "eval_samples_per_second": 23.902,
265
+ "eval_steps_per_second": 3.012,
266
+ "eval_wer": 0.998,
267
+ "step": 2300
268
+ },
269
+ {
270
+ "epoch": 17.02127659574468,
271
+ "eval_cer": 0.1069188080588732,
272
+ "eval_loss": 0.16668924689292908,
273
+ "eval_runtime": 21.205,
274
+ "eval_samples_per_second": 23.579,
275
+ "eval_steps_per_second": 2.971,
276
+ "eval_wer": 0.998,
277
+ "step": 2400
278
+ },
279
+ {
280
+ "epoch": 17.73049645390071,
281
+ "grad_norm": 2.1788010597229004,
282
+ "learning_rate": 5.9903999999999994e-05,
283
+ "loss": 0.2296,
284
+ "step": 2500
285
+ },
286
+ {
287
+ "epoch": 17.73049645390071,
288
+ "eval_cer": 0.10688864760525998,
289
+ "eval_loss": 0.16431093215942383,
290
+ "eval_runtime": 21.0484,
291
+ "eval_samples_per_second": 23.755,
292
+ "eval_steps_per_second": 2.993,
293
+ "eval_wer": 1.0,
294
+ "step": 2500
295
+ },
296
+ {
297
+ "epoch": 18.43971631205674,
298
+ "eval_cer": 0.10706961032693932,
299
+ "eval_loss": 0.16017669439315796,
300
+ "eval_runtime": 20.7713,
301
+ "eval_samples_per_second": 24.072,
302
+ "eval_steps_per_second": 3.033,
303
+ "eval_wer": 1.0,
304
+ "step": 2600
305
+ },
306
+ {
307
+ "epoch": 19.148936170212767,
308
+ "eval_cer": 0.10682832669803353,
309
+ "eval_loss": 0.16536767780780792,
310
+ "eval_runtime": 21.3386,
311
+ "eval_samples_per_second": 23.432,
312
+ "eval_steps_per_second": 2.952,
313
+ "eval_wer": 1.0,
314
+ "step": 2700
315
+ },
316
+ {
317
+ "epoch": 19.858156028368793,
318
+ "eval_cer": 0.10604415490408976,
319
+ "eval_loss": 0.16166533529758453,
320
+ "eval_runtime": 21.3062,
321
+ "eval_samples_per_second": 23.467,
322
+ "eval_steps_per_second": 2.957,
323
+ "eval_wer": 0.998,
324
+ "step": 2800
325
+ },
326
+ {
327
+ "epoch": 20.0,
328
+ "step": 2820,
329
+ "total_flos": 4.085369652431226e+18,
330
+ "train_loss": 2.2413718947282075,
331
+ "train_runtime": 5214.7646,
332
+ "train_samples_per_second": 17.259,
333
+ "train_steps_per_second": 0.541
334
+ }
335
+ ],
336
+ "logging_steps": 500,
337
+ "max_steps": 2820,
338
+ "num_input_tokens_seen": 0,
339
+ "num_train_epochs": 20,
340
+ "save_steps": 400,
341
+ "stateful_callbacks": {
342
+ "TrainerControl": {
343
+ "args": {
344
+ "should_epoch_stop": false,
345
+ "should_evaluate": false,
346
+ "should_log": false,
347
+ "should_save": true,
348
+ "should_training_stop": true
349
+ },
350
+ "attributes": {}
351
+ }
352
+ },
353
+ "total_flos": 4.085369652431226e+18,
354
+ "train_batch_size": 16,
355
+ "trial_name": null,
356
+ "trial_params": null
357
+ }