Basma2423 committed on
Commit
c33c595
·
verified ·
1 Parent(s): 847a50b

Training in progress, step 14454

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4b68629a4e7fbfde0f1b640d08dd2775f2c2f532f4da2add4ee14e34b66f168
3
  size 667849236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccde7dcbe6e25cdd0c618ccbadaa82a004cc2e139e8990a1ed95973e15de90fb
3
  size 667849236
runs/May06_08-32-58_ip-10-192-12-5/events.out.tfevents.1746520379.ip-10-192-12-5.1614.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15f75329ed85e5259d9f5137f58b6204f020a8aea0824b5596178ecc4190cfab
3
- size 7028
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:333d6fe335443bca75bb171cad5174ecb32002e6f3ed041aff8451bf09175c6b
3
+ size 8120
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 12848,
3
- "best_metric": 0.706664474285978,
4
- "best_model_checkpoint": "checkpoints/checkpoint-12848",
5
- "epoch": 1.9999610849515508,
6
  "eval_steps": 1606,
7
- "global_step": 12848,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -279,6 +279,39 @@
279
  "eval_steps_per_second": 1.746,
280
  "eval_wer": 0.6722098612169899,
281
  "step": 12848
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
282
  }
283
  ],
284
  "logging_steps": 500,
@@ -298,7 +331,7 @@
298
  "attributes": {}
299
  }
300
  },
301
- "total_flos": 1.0027694737084908e+18,
302
  "train_batch_size": 256,
303
  "trial_name": null,
304
  "trial_params": null
 
1
  {
2
+ "best_global_step": 14454,
3
+ "best_metric": 0.7064455694431908,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-14454",
5
+ "epoch": 2.2499902712378876,
6
  "eval_steps": 1606,
7
+ "global_step": 14454,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
279
  "eval_steps_per_second": 1.746,
280
  "eval_wer": 0.6722098612169899,
281
  "step": 12848
282
+ },
283
+ {
284
+ "epoch": 2.0236603494571352,
285
+ "grad_norm": 0.028502434492111206,
286
+ "learning_rate": 4.898157560336646e-05,
287
+ "loss": 0.043,
288
+ "step": 13000
289
+ },
290
+ {
291
+ "epoch": 2.101490446355606,
292
+ "grad_norm": 0.030778545886278152,
293
+ "learning_rate": 4.832692770033863e-05,
294
+ "loss": 0.0417,
295
+ "step": 13500
296
+ },
297
+ {
298
+ "epoch": 2.1793205432540765,
299
+ "grad_norm": 0.0269626472145319,
300
+ "learning_rate": 4.7517396965763394e-05,
301
+ "loss": 0.041,
302
+ "step": 14000
303
+ },
304
+ {
305
+ "epoch": 2.2499902712378876,
306
+ "eval_avg": 0.7064455694431908,
307
+ "eval_cer": 0.6538135050224774,
308
+ "eval_der": 0.7939745658437141,
309
+ "eval_loss": 0.032875534147024155,
310
+ "eval_runtime": 304.6489,
311
+ "eval_samples_per_second": 445.506,
312
+ "eval_steps_per_second": 1.743,
313
+ "eval_wer": 0.6715486374633808,
314
+ "step": 14454
315
  }
316
  ],
317
  "logging_steps": 500,
 
331
  "attributes": {}
332
  }
333
  },
334
+ "total_flos": 1.1281347889956127e+18,
335
  "train_batch_size": 256,
336
  "trial_name": null,
337
  "trial_params": null