samil24 committed on
Commit
b50eeec
·
verified ·
1 Parent(s): b76c0a1

End of training

Browse files
Files changed (2) hide show
  1. README.md +48 -12
  2. generation_config.json +2 -94
README.md CHANGED
@@ -18,9 +18,9 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [openai/whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) on an unspecified dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.2801
22
- - Wer: 84.6009
23
- - Cer: 70.1608
24
 
25
  ## Model description
26
 
@@ -39,23 +39,59 @@ More information needed
39
  ### Training hyperparameters
40
 
41
  The following hyperparameters were used during training:
42
- - learning_rate: 8e-06
43
  - train_batch_size: 16
44
  - eval_batch_size: 16
45
  - seed: 42
46
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
47
  - lr_scheduler_type: cosine
48
- - lr_scheduler_warmup_steps: 8000
49
- - num_epochs: 5
50
 
51
  ### Training results
52
 
53
- | Training Loss | Epoch | Step | Validation Loss | Wer | Cer |
54
- |:-------------:|:------:|:-----:|:---------------:|:-------:|:-------:|
55
- | 0.2359 | 1.2472 | 5000 | 0.2733 | 94.9788 | 93.0093 |
56
- | 0.1824 | 2.4944 | 10000 | 0.2674 | 66.9301 | 53.0174 |
57
- | 0.1267 | 3.7416 | 15000 | 0.2587 | 79.5997 | 65.3546 |
58
- | 0.0775 | 4.9888 | 20000 | 0.2801 | 84.6009 | 70.1608 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
59
 
60
 
61
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [openai/whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) on an unspecified dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.5546
22
+ - Wer: 82.4230
23
+ - Cer: 64.5239
24
 
25
  ## Model description
26
 
 
39
  ### Training hyperparameters
40
 
41
  The following hyperparameters were used during training:
42
+ - learning_rate: 1e-05
43
  - train_batch_size: 16
44
  - eval_batch_size: 16
45
  - seed: 42
46
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
47
  - lr_scheduler_type: cosine
48
+ - lr_scheduler_warmup_steps: 2000
49
+ - num_epochs: 15
50
 
51
  ### Training results
52
 
53
+ | Training Loss | Epoch | Step | Validation Loss | Wer | Cer |
54
+ |:-------------:|:-------:|:-----:|:---------------:|:--------:|:-------:|
55
+ | 0.2956 | 0.3742 | 1500 | 0.3018 | 63.6348 | 47.5770 |
56
+ | 0.2867 | 0.7483 | 3000 | 0.2841 | 93.2416 | 79.6830 |
57
+ | 0.213 | 1.1225 | 4500 | 0.2759 | 97.8988 | 85.8519 |
58
+ | 0.227 | 1.4966 | 6000 | 0.2677 | 91.6266 | 74.8936 |
59
+ | 0.2212 | 1.8708 | 7500 | 0.2617 | 93.4321 | 79.6175 |
60
+ | 0.1611 | 2.2449 | 9000 | 0.2667 | 96.8099 | 78.9492 |
61
+ | 0.1589 | 2.6191 | 10500 | 0.2643 | 100.5175 | 76.5414 |
62
+ | 0.1697 | 2.9933 | 12000 | 0.2622 | 84.5441 | 67.4836 |
63
+ | 0.1071 | 3.3674 | 13500 | 0.2855 | 96.4829 | 81.3859 |
64
+ | 0.1136 | 3.7416 | 15000 | 0.2814 | 99.5195 | 75.9088 |
65
+ | 0.0637 | 4.1157 | 16500 | 0.3122 | 83.2163 | 64.5333 |
66
+ | 0.0692 | 4.4899 | 18000 | 0.3137 | 90.7196 | 76.6609 |
67
+ | 0.0687 | 4.8641 | 19500 | 0.3179 | 91.4560 | 75.3464 |
68
+ | 0.0333 | 5.2382 | 21000 | 0.3506 | 90.0088 | 71.7452 |
69
+ | 0.0366 | 5.6124 | 22500 | 0.3571 | 86.4889 | 69.5759 |
70
+ | 0.0379 | 5.9865 | 24000 | 0.3554 | 88.3228 | 63.6308 |
71
+ | 0.0174 | 6.3607 | 25500 | 0.3917 | 91.0494 | 75.0314 |
72
+ | 0.0176 | 6.7348 | 27000 | 0.3937 | 84.2740 | 64.2078 |
73
+ | 0.0075 | 7.1090 | 28500 | 0.4261 | 83.2419 | 65.5333 |
74
+ | 0.0092 | 7.4832 | 30000 | 0.4228 | 89.9832 | 69.3133 |
75
+ | 0.0096 | 7.8573 | 31500 | 0.4328 | 86.2415 | 71.8841 |
76
+ | 0.0042 | 8.2315 | 33000 | 0.4482 | 83.1168 | 64.2068 |
77
+ | 0.0045 | 8.6056 | 34500 | 0.4502 | 86.0169 | 67.4873 |
78
+ | 0.005 | 8.9798 | 36000 | 0.4580 | 83.4096 | 65.3331 |
79
+ | 0.0027 | 9.3540 | 37500 | 0.4667 | 82.2837 | 60.9284 |
80
+ | 0.0027 | 9.7281 | 39000 | 0.4718 | 84.5469 | 63.7325 |
81
+ | 0.0012 | 10.1023 | 40500 | 0.4819 | 80.8678 | 62.0516 |
82
+ | 0.0012 | 10.4764 | 42000 | 0.4911 | 81.6951 | 59.3660 |
83
+ | 0.0013 | 10.8506 | 43500 | 0.4950 | 78.6415 | 60.5107 |
84
+ | 0.0005 | 11.2247 | 45000 | 0.5076 | 81.8117 | 62.4285 |
85
+ | 0.0005 | 11.5989 | 46500 | 0.5055 | 78.8746 | 59.2439 |
86
+ | 0.0008 | 11.9731 | 48000 | 0.5101 | 79.2244 | 59.3010 |
87
+ | 0.0006 | 12.3472 | 49500 | 0.5234 | 81.2459 | 63.5160 |
88
+ | 0.0002 | 12.7214 | 51000 | 0.5310 | 83.3272 | 65.2183 |
89
+ | 0.0001 | 13.0955 | 52500 | 0.5380 | 83.5347 | 65.1864 |
90
+ | 0.0001 | 13.4697 | 54000 | 0.5450 | 81.4990 | 63.0972 |
91
+ | 0.0001 | 13.8439 | 55500 | 0.5491 | 82.4230 | 64.9317 |
92
+ | 0.0001 | 14.2180 | 57000 | 0.5523 | 82.3889 | 64.7414 |
93
+ | 0.0001 | 14.5922 | 58500 | 0.5544 | 82.5510 | 64.7718 |
94
+ | 0.0001 | 14.9663 | 60000 | 0.5546 | 82.4230 | 64.5239 |
95
 
96
 
97
  ### Framework versions
generation_config.json CHANGED
@@ -41,10 +41,7 @@
41
  6
42
  ]
43
  ],
44
- "begin_suppress_tokens": [
45
- 220,
46
- 50257
47
- ],
48
  "bos_token_id": 50257,
49
  "decoder_start_token_id": 50258,
50
  "eos_token_id": 50257,
@@ -151,102 +148,13 @@
151
  "<|yue|>": 50358,
152
  "<|zh|>": 50260
153
  },
 
154
  "max_initial_timestamp_index": 50,
155
  "max_length": 448,
156
  "no_timestamps_token_id": 50364,
157
  "pad_token_id": 50257,
158
  "prev_sot_token_id": 50362,
159
  "return_timestamps": false,
160
- "suppress_tokens": [
161
- 1,
162
- 2,
163
- 7,
164
- 8,
165
- 9,
166
- 10,
167
- 14,
168
- 25,
169
- 26,
170
- 27,
171
- 28,
172
- 29,
173
- 31,
174
- 58,
175
- 59,
176
- 60,
177
- 61,
178
- 62,
179
- 63,
180
- 90,
181
- 91,
182
- 92,
183
- 93,
184
- 359,
185
- 503,
186
- 522,
187
- 542,
188
- 873,
189
- 893,
190
- 902,
191
- 918,
192
- 922,
193
- 931,
194
- 1350,
195
- 1853,
196
- 1982,
197
- 2460,
198
- 2627,
199
- 3246,
200
- 3253,
201
- 3268,
202
- 3536,
203
- 3846,
204
- 3961,
205
- 4183,
206
- 4667,
207
- 6585,
208
- 6647,
209
- 7273,
210
- 9061,
211
- 9383,
212
- 10428,
213
- 10929,
214
- 11938,
215
- 12033,
216
- 12331,
217
- 12562,
218
- 13793,
219
- 14157,
220
- 14635,
221
- 15265,
222
- 15618,
223
- 16553,
224
- 16604,
225
- 18362,
226
- 18956,
227
- 20075,
228
- 21675,
229
- 22520,
230
- 26130,
231
- 26161,
232
- 26435,
233
- 28279,
234
- 29464,
235
- 31650,
236
- 32302,
237
- 32470,
238
- 36865,
239
- 42863,
240
- 47425,
241
- 49870,
242
- 50254,
243
- 50258,
244
- 50359,
245
- 50360,
246
- 50361,
247
- 50362,
248
- 50363
249
- ],
250
  "task": "transcribe",
251
  "task_to_id": {
252
  "transcribe": 50360,
 
41
  6
42
  ]
43
  ],
44
+ "begin_suppress_tokens": [],
 
 
 
45
  "bos_token_id": 50257,
46
  "decoder_start_token_id": 50258,
47
  "eos_token_id": 50257,
 
148
  "<|yue|>": 50358,
149
  "<|zh|>": 50260
150
  },
151
+ "language": "ar",
152
  "max_initial_timestamp_index": 50,
153
  "max_length": 448,
154
  "no_timestamps_token_id": 50364,
155
  "pad_token_id": 50257,
156
  "prev_sot_token_id": 50362,
157
  "return_timestamps": false,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
158
  "task": "transcribe",
159
  "task_to_id": {
160
  "transcribe": 50360,