longdnk committed on
Commit
343d222
·
verified ·
1 Parent(s): deac3b3

Upload 12 files

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8100fede3ebe12028e1a6a943068124b87c44e904129909600f8aa61534da523
3
  size 1264702096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db26089639bed1d2042ae44508cfe824d8a32650e6c7a551b589f9d746235bc1
3
  size 1264702096
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64f466b795a2b3f1ba9a0a42ea3004a4fecc0d41800f8d661e39d9eeb5c1c572
3
  size 2495948982
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34a41698f332471e4edf3ba686ae22f0a6f4731aa35ba0f155586809001de0d1
3
  size 2495948982
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad8e0e131aa62acb514576ec4fc6d35c4209b434e53cc06404b8837a81316972
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea2014619ab560562b67af3ac493f171046c4761b85b6e9309d2e81fe852477e
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b37cc57efe149b952d1d08baf340d5ff65995cd05283b74a9e6abf14b366d6de
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:623a857fed43a56c0eb1d901869237571e3979cc10ac0751899d9842563263de
3
  size 1064
special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>"}
tokenizer_config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "pad_token": "<pad>", "do_lower_case": true, "word_delimiter_token": "|", "tokenizer_class": "Wav2Vec2CTCTokenizer"}
trainer_state.json CHANGED
@@ -1,96 +1,296 @@
1
  {
2
- "best_metric": 0.14490656554698944,
3
- "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-2000",
4
- "epoch": 0.986679822397632,
5
  "eval_steps": 500,
6
- "global_step": 2000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.246669955599408,
13
- "grad_norm": 3.482757329940796,
14
  "learning_rate": 4.97e-05,
15
- "loss": 0.445,
16
  "step": 500
17
  },
18
  {
19
- "epoch": 0.246669955599408,
20
- "eval_cer": 0.03472612578852039,
21
- "eval_loss": 0.1506977081298828,
22
- "eval_mer": 0.2400241837968561,
23
- "eval_runtime": 72.835,
24
- "eval_samples_per_second": 16.695,
25
- "eval_steps_per_second": 2.087,
26
- "eval_wer": 0.24393241167434715,
27
- "eval_wil": 0.4027411629459634,
28
- "eval_wip": 0.5972588370540366,
29
  "step": 500
30
  },
31
  {
32
- "epoch": 0.493339911198816,
33
- "grad_norm": 2.1172962188720703,
34
- "learning_rate": 4.5547392940333276e-05,
35
- "loss": 0.4275,
36
  "step": 1000
37
  },
38
  {
39
- "epoch": 0.493339911198816,
40
- "eval_cer": 0.03416401224158391,
41
- "eval_loss": 0.15176725387573242,
42
- "eval_mer": 0.23524069028156222,
43
- "eval_runtime": 72.5697,
44
- "eval_samples_per_second": 16.756,
45
- "eval_steps_per_second": 2.095,
46
- "eval_wer": 0.23870967741935484,
47
- "eval_wil": 0.3973965187752956,
48
- "eval_wip": 0.6026034812247044,
49
  "step": 1000
50
  },
51
  {
52
- "epoch": 0.740009866798224,
53
- "grad_norm": 3.9609649181365967,
54
- "learning_rate": 4.1067908976885865e-05,
55
- "loss": 0.4367,
56
  "step": 1500
57
  },
58
  {
59
- "epoch": 0.740009866798224,
60
- "eval_cer": 0.032727499843857345,
61
- "eval_loss": 0.14839377999305725,
62
- "eval_mer": 0.21904472163066627,
63
- "eval_runtime": 72.6193,
64
- "eval_samples_per_second": 16.745,
65
- "eval_steps_per_second": 2.093,
66
- "eval_wer": 0.22119815668202766,
67
- "eval_wil": 0.3745997578877486,
68
- "eval_wip": 0.6254002421122514,
69
  "step": 1500
70
  },
71
  {
72
- "epoch": 0.986679822397632,
73
- "grad_norm": 3.834362268447876,
74
- "learning_rate": 3.6588425013438454e-05,
75
- "loss": 0.4128,
76
  "step": 2000
77
  },
78
  {
79
- "epoch": 0.986679822397632,
80
- "eval_cer": 0.032602585722315905,
81
- "eval_loss": 0.14490656554698944,
82
- "eval_mer": 0.21031746031746032,
83
- "eval_runtime": 72.7757,
84
- "eval_samples_per_second": 16.709,
85
- "eval_steps_per_second": 2.089,
86
- "eval_wer": 0.21167434715821812,
87
- "eval_wil": 0.3614631097880948,
88
- "eval_wip": 0.6385368902119052,
89
  "step": 2000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  }
91
  ],
92
  "logging_steps": 500,
93
- "max_steps": 6081,
94
  "num_input_tokens_seen": 0,
95
  "num_train_epochs": 3,
96
  "save_steps": 500,
@@ -101,13 +301,13 @@
101
  "should_evaluate": false,
102
  "should_log": false,
103
  "should_save": true,
104
- "should_training_stop": false
105
  },
106
  "attributes": {}
107
  }
108
  },
109
- "total_flos": 3.2957716566380933e+18,
110
- "train_batch_size": 12,
111
  "trial_name": null,
112
  "trial_params": null
113
  }
 
1
  {
2
+ "best_metric": 0.11605404317378998,
3
+ "best_model_checkpoint": "./wav2vec2-base-demo/checkpoint-7000",
4
+ "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 7296,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.20559210526315788,
13
+ "grad_norm": 1.0479871034622192,
14
  "learning_rate": 4.97e-05,
15
+ "loss": 0.2427,
16
  "step": 500
17
  },
18
  {
19
+ "epoch": 0.20559210526315788,
20
+ "eval_cer": 0.03330171560541076,
21
+ "eval_loss": 0.14631743729114532,
22
+ "eval_mer": 0.2295178941141674,
23
+ "eval_runtime": 73.5989,
24
+ "eval_samples_per_second": 16.522,
25
+ "eval_steps_per_second": 2.065,
26
+ "eval_wer": 0.23178016726403824,
27
+ "eval_wil": 0.38783171622631485,
28
+ "eval_wip": 0.6121682837736852,
29
  "step": 500
30
  },
31
  {
32
+ "epoch": 0.41118421052631576,
33
+ "grad_norm": 7.891260147094727,
34
+ "learning_rate": 4.634343731606828e-05,
35
+ "loss": 0.129,
36
  "step": 1000
37
  },
38
  {
39
+ "epoch": 0.41118421052631576,
40
+ "eval_cer": 0.034745133619267565,
41
+ "eval_loss": 0.15320204198360443,
42
+ "eval_mer": 0.22595870206489677,
43
+ "eval_runtime": 73.4082,
44
+ "eval_samples_per_second": 16.565,
45
+ "eval_steps_per_second": 2.071,
46
+ "eval_wer": 0.22879330943847073,
47
+ "eval_wil": 0.38389337364965037,
48
+ "eval_wip": 0.6161066263503496,
49
  "step": 1000
50
  },
51
  {
52
+ "epoch": 0.6167763157894737,
53
+ "grad_norm": 3.9030227661132812,
54
+ "learning_rate": 4.266480282519129e-05,
55
+ "loss": 0.1431,
56
  "step": 1500
57
  },
58
  {
59
+ "epoch": 0.6167763157894737,
60
+ "eval_cer": 0.034745133619267565,
61
+ "eval_loss": 0.15051577985286713,
62
+ "eval_mer": 0.23915626856803326,
63
+ "eval_runtime": 73.4176,
64
+ "eval_samples_per_second": 16.563,
65
+ "eval_steps_per_second": 2.07,
66
+ "eval_wer": 0.240442054958184,
67
+ "eval_wil": 0.397231780167264,
68
+ "eval_wip": 0.602768219832736,
69
  "step": 1500
70
  },
71
  {
72
+ "epoch": 0.8223684210526315,
73
+ "grad_norm": 1.7316572666168213,
74
+ "learning_rate": 3.8986168334314304e-05,
75
+ "loss": 0.1393,
76
  "step": 2000
77
  },
78
  {
79
+ "epoch": 0.8223684210526315,
80
+ "eval_cer": 0.03425024744308809,
81
+ "eval_loss": 0.14699852466583252,
82
+ "eval_mer": 0.2295903330386089,
83
+ "eval_runtime": 73.3571,
84
+ "eval_samples_per_second": 16.576,
85
+ "eval_steps_per_second": 2.072,
86
+ "eval_wer": 0.23267622461170848,
87
+ "eval_wil": 0.38674316181876667,
88
+ "eval_wip": 0.6132568381812333,
89
  "step": 2000
90
+ },
91
+ {
92
+ "epoch": 1.0279605263157894,
93
+ "grad_norm": 1.396478533744812,
94
+ "learning_rate": 3.530753384343732e-05,
95
+ "loss": 0.1505,
96
+ "step": 2500
97
+ },
98
+ {
99
+ "epoch": 1.0279605263157894,
100
+ "eval_cer": 0.033136753546684265,
101
+ "eval_loss": 0.14985224604606628,
102
+ "eval_mer": 0.2275943396226415,
103
+ "eval_runtime": 74.0264,
104
+ "eval_samples_per_second": 16.427,
105
+ "eval_steps_per_second": 2.053,
106
+ "eval_wer": 0.23058542413381122,
107
+ "eval_wil": 0.38484887915314825,
108
+ "eval_wip": 0.6151511208468518,
109
+ "step": 2500
110
+ },
111
+ {
112
+ "epoch": 1.2335526315789473,
113
+ "grad_norm": 0.4791443347930908,
114
+ "learning_rate": 3.163625662154209e-05,
115
+ "loss": 0.1636,
116
+ "step": 3000
117
+ },
118
+ {
119
+ "epoch": 1.2335526315789473,
120
+ "eval_cer": 0.03352853843615968,
121
+ "eval_loss": 0.14658136665821075,
122
+ "eval_mer": 0.2253104671791839,
123
+ "eval_runtime": 73.6214,
124
+ "eval_samples_per_second": 16.517,
125
+ "eval_steps_per_second": 2.065,
126
+ "eval_wer": 0.22759856630824374,
127
+ "eval_wil": 0.38094846443763386,
128
+ "eval_wip": 0.6190515355623661,
129
+ "step": 3000
130
+ },
131
+ {
132
+ "epoch": 1.4391447368421053,
133
+ "grad_norm": 0.7940099239349365,
134
+ "learning_rate": 2.79576221306651e-05,
135
+ "loss": 0.179,
136
+ "step": 3500
137
+ },
138
+ {
139
+ "epoch": 1.4391447368421053,
140
+ "eval_cer": 0.03336357637743319,
141
+ "eval_loss": 0.13871586322784424,
142
+ "eval_mer": 0.22300884955752212,
143
+ "eval_runtime": 73.6122,
144
+ "eval_samples_per_second": 16.519,
145
+ "eval_steps_per_second": 2.065,
146
+ "eval_wer": 0.22580645161290322,
147
+ "eval_wil": 0.3782571805567654,
148
+ "eval_wip": 0.6217428194432346,
149
+ "step": 3500
150
+ },
151
+ {
152
+ "epoch": 1.6447368421052633,
153
+ "grad_norm": 1.963213562965393,
154
+ "learning_rate": 2.4278987639788112e-05,
155
+ "loss": 0.2181,
156
+ "step": 4000
157
+ },
158
+ {
159
+ "epoch": 1.6447368421052633,
160
+ "eval_cer": 0.032641867370504785,
161
+ "eval_loss": 0.13555069267749786,
162
+ "eval_mer": 0.2170839469808542,
163
+ "eval_runtime": 73.2159,
164
+ "eval_samples_per_second": 16.608,
165
+ "eval_steps_per_second": 2.076,
166
+ "eval_wer": 0.22013142174432496,
167
+ "eval_wil": 0.36858040063576636,
168
+ "eval_wip": 0.6314195993642336,
169
+ "step": 4000
170
+ },
171
+ {
172
+ "epoch": 1.850328947368421,
173
+ "grad_norm": 6.549672603607178,
174
+ "learning_rate": 2.0600353148911125e-05,
175
+ "loss": 0.2413,
176
+ "step": 4500
177
+ },
178
+ {
179
+ "epoch": 1.850328947368421,
180
+ "eval_cer": 0.030621082151105247,
181
+ "eval_loss": 0.1285562515258789,
182
+ "eval_mer": 0.2132114420524919,
183
+ "eval_runtime": 73.5544,
184
+ "eval_samples_per_second": 16.532,
185
+ "eval_steps_per_second": 2.066,
186
+ "eval_wer": 0.21594982078853048,
187
+ "eval_wil": 0.3613360451023606,
188
+ "eval_wip": 0.6386639548976394,
189
+ "step": 4500
190
+ },
191
+ {
192
+ "epoch": 2.0559210526315788,
193
+ "grad_norm": 2.745516061782837,
194
+ "learning_rate": 1.6929075927015892e-05,
195
+ "loss": 0.2935,
196
+ "step": 5000
197
+ },
198
+ {
199
+ "epoch": 2.0559210526315788,
200
+ "eval_cer": 0.029486967997360607,
201
+ "eval_loss": 0.12071426212787628,
202
+ "eval_mer": 0.2039551357733176,
203
+ "eval_runtime": 73.611,
204
+ "eval_samples_per_second": 16.519,
205
+ "eval_steps_per_second": 2.065,
206
+ "eval_wer": 0.20639187574671444,
207
+ "eval_wil": 0.34776843790653456,
208
+ "eval_wip": 0.6522315620934654,
209
+ "step": 5000
210
+ },
211
+ {
212
+ "epoch": 2.2615131578947367,
213
+ "grad_norm": 1.6406818628311157,
214
+ "learning_rate": 1.3265155974102414e-05,
215
+ "loss": 0.3035,
216
+ "step": 5500
217
+ },
218
+ {
219
+ "epoch": 2.2615131578947367,
220
+ "eval_cer": 0.02928076542395249,
221
+ "eval_loss": 0.11994051933288574,
222
+ "eval_mer": 0.19940828402366864,
223
+ "eval_runtime": 73.791,
224
+ "eval_samples_per_second": 16.479,
225
+ "eval_steps_per_second": 2.06,
226
+ "eval_wer": 0.2013142174432497,
227
+ "eval_wil": 0.34143103677153863,
228
+ "eval_wip": 0.6585689632284614,
229
+ "step": 5500
230
+ },
231
+ {
232
+ "epoch": 2.4671052631578947,
233
+ "grad_norm": 1.5923278331756592,
234
+ "learning_rate": 9.586521483225428e-06,
235
+ "loss": 0.3185,
236
+ "step": 6000
237
+ },
238
+ {
239
+ "epoch": 2.4671052631578947,
240
+ "eval_cer": 0.028909600791817883,
241
+ "eval_loss": 0.11905083060264587,
242
+ "eval_mer": 0.1989946777054997,
243
+ "eval_runtime": 73.7234,
244
+ "eval_samples_per_second": 16.494,
245
+ "eval_steps_per_second": 2.062,
246
+ "eval_wer": 0.20101553166069294,
247
+ "eval_wil": 0.34076400679117147,
248
+ "eval_wip": 0.6592359932088285,
249
+ "step": 6000
250
+ },
251
+ {
252
+ "epoch": 2.6726973684210527,
253
+ "grad_norm": 1.212615728378296,
254
+ "learning_rate": 5.907886992348441e-06,
255
+ "loss": 0.3023,
256
+ "step": 6500
257
+ },
258
+ {
259
+ "epoch": 2.6726973684210527,
260
+ "eval_cer": 0.028579676674364896,
261
+ "eval_loss": 0.11668401211500168,
262
+ "eval_mer": 0.19840094758661533,
263
+ "eval_runtime": 73.4554,
264
+ "eval_samples_per_second": 16.554,
265
+ "eval_steps_per_second": 2.069,
266
+ "eval_wer": 0.2001194743130227,
267
+ "eval_wil": 0.34014943834106115,
268
+ "eval_wip": 0.6598505616589389,
269
+ "step": 6500
270
+ },
271
+ {
272
+ "epoch": 2.8782894736842106,
273
+ "grad_norm": 1.4651743173599243,
274
+ "learning_rate": 2.229252501471454e-06,
275
+ "loss": 0.3116,
276
+ "step": 7000
277
+ },
278
+ {
279
+ "epoch": 2.8782894736842106,
280
+ "eval_cer": 0.02839409435829759,
281
+ "eval_loss": 0.11605404317378998,
282
+ "eval_mer": 0.19668737060041408,
283
+ "eval_runtime": 73.5998,
284
+ "eval_samples_per_second": 16.522,
285
+ "eval_steps_per_second": 2.065,
286
+ "eval_wer": 0.19862604540023895,
287
+ "eval_wil": 0.3373527007482864,
288
+ "eval_wip": 0.6626472992517136,
289
+ "step": 7000
290
  }
291
  ],
292
  "logging_steps": 500,
293
+ "max_steps": 7296,
294
  "num_input_tokens_seen": 0,
295
  "num_train_epochs": 3,
296
  "save_steps": 500,
 
301
  "should_evaluate": false,
302
  "should_log": false,
303
  "should_save": true,
304
+ "should_training_stop": true
305
  },
306
  "attributes": {}
307
  }
308
  },
309
+ "total_flos": 9.992785283464022e+18,
310
+ "train_batch_size": 10,
311
  "trial_name": null,
312
  "trial_params": null
313
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1456fbb80fdcd6a8b153f11eeae0fef4bc2173125f866d139aac039bc0656f69
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bf5af7ff8411218351a777026fc80bf0652d760c3902741ad28215c5270edd0
3
  size 5176