Basma2423 committed on
Commit
627dc76
·
verified ·
1 Parent(s): 7554217

Training in progress, step 16060

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ccde7dcbe6e25cdd0c618ccbadaa82a004cc2e139e8990a1ed95973e15de90fb
3
  size 667849236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae5d5f2467be1e0f32383e0f24718a2027023a02821399a4ab911c4727fe071e
3
  size 667849236
runs/May06_08-32-58_ip-10-192-12-5/events.out.tfevents.1746520379.ip-10-192-12-5.1614.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:333d6fe335443bca75bb171cad5174ecb32002e6f3ed041aff8451bf09175c6b
3
- size 8120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bf97edebecbae8fc943eb5835585041af0dec87a18f100369ec0e37270d0603
3
+ size 9423
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 14454,
3
- "best_metric": 0.7064455694431908,
4
- "best_model_checkpoint": "checkpoints/checkpoint-14454",
5
- "epoch": 2.2499902712378876,
6
  "eval_steps": 1606,
7
- "global_step": 14454,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -312,6 +312,46 @@
312
  "eval_steps_per_second": 1.743,
313
  "eval_wer": 0.6715486374633808,
314
  "step": 14454
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
315
  }
316
  ],
317
  "logging_steps": 500,
@@ -331,7 +371,7 @@
331
  "attributes": {}
332
  }
333
  },
334
- "total_flos": 1.1281347889956127e+18,
335
  "train_batch_size": 256,
336
  "trial_name": null,
337
  "trial_params": null
 
1
  {
2
+ "best_global_step": 16060,
3
+ "best_metric": 0.7061941356307186,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-16060",
5
+ "epoch": 2.4999805424757753,
6
  "eval_steps": 1606,
7
+ "global_step": 16060,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
312
  "eval_steps_per_second": 1.743,
313
  "eval_wer": 0.6715486374633808,
314
  "step": 14454
315
+ },
316
+ {
317
+ "epoch": 2.257150640152547,
318
+ "grad_norm": 0.03818966820836067,
319
+ "learning_rate": 4.6558358407185946e-05,
320
+ "loss": 0.0402,
321
+ "step": 14500
322
+ },
323
+ {
324
+ "epoch": 2.3349807370510174,
325
+ "grad_norm": 0.029628828167915344,
326
+ "learning_rate": 4.5456179713031586e-05,
327
+ "loss": 0.0395,
328
+ "step": 15000
329
+ },
330
+ {
331
+ "epoch": 2.4128108339494885,
332
+ "grad_norm": 0.02792350761592388,
333
+ "learning_rate": 4.4218178973329804e-05,
334
+ "loss": 0.0392,
335
+ "step": 15500
336
+ },
337
+ {
338
+ "epoch": 2.4906409308479587,
339
+ "grad_norm": 0.03364017978310585,
340
+ "learning_rate": 4.2852576090096216e-05,
341
+ "loss": 0.0384,
342
+ "step": 16000
343
+ },
344
+ {
345
+ "epoch": 2.4999805424757753,
346
+ "eval_avg": 0.7061941356307186,
347
+ "eval_cer": 0.6537081045699137,
348
+ "eval_der": 0.7939727975362082,
349
+ "eval_loss": 0.031167298555374146,
350
+ "eval_runtime": 303.0246,
351
+ "eval_samples_per_second": 447.894,
352
+ "eval_steps_per_second": 1.752,
353
+ "eval_wer": 0.670901504786034,
354
+ "step": 16060
355
  }
356
  ],
357
  "logging_steps": 500,
 
371
  "attributes": {}
372
  }
373
  },
374
+ "total_flos": 1.253480973209174e+18,
375
  "train_batch_size": 256,
376
  "trial_name": null,
377
  "trial_params": null