Basma2423 committed on
Commit
2f7106e
·
verified ·
1 Parent(s): 169c98a

Training in progress, step 17666

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae5d5f2467be1e0f32383e0f24718a2027023a02821399a4ab911c4727fe071e
3
  size 667849236
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc3dbc93a147703d7016436477b309809daf6cf7dfd5459380d02ef6d6acd536
3
  size 667849236
runs/May06_08-32-58_ip-10-192-12-5/events.out.tfevents.1746520379.ip-10-192-12-5.1614.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2bf97edebecbae8fc943eb5835585041af0dec87a18f100369ec0e37270d0603
3
- size 9423
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd6f2c048a39e9b58f1bdb0970c43405dcc4a73b61c2610eb9690cd98318f6e9
3
+ size 10536
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 16060,
3
- "best_metric": 0.7061941356307186,
4
- "best_model_checkpoint": "checkpoints/checkpoint-16060",
5
- "epoch": 2.4999805424757753,
6
  "eval_steps": 1606,
7
- "global_step": 16060,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -352,6 +352,39 @@
352
  "eval_steps_per_second": 1.752,
353
  "eval_wer": 0.670901504786034,
354
  "step": 16060
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
355
  }
356
  ],
357
  "logging_steps": 500,
@@ -371,7 +404,7 @@
371
  "attributes": {}
372
  }
373
  },
374
- "total_flos": 1.253480973209174e+18,
375
  "train_batch_size": 256,
376
  "trial_name": null,
377
  "trial_params": null
 
1
  {
2
+ "best_global_step": 17666,
3
+ "best_metric": 0.706001258948505,
4
+ "best_model_checkpoint": "checkpoints/checkpoint-17666",
5
+ "epoch": 2.749970813713663,
6
  "eval_steps": 1606,
7
+ "global_step": 17666,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
352
  "eval_steps_per_second": 1.752,
353
  "eval_wer": 0.670901504786034,
354
  "step": 16060
355
+ },
356
+ {
357
+ "epoch": 2.5684710277464298,
358
+ "grad_norm": 0.032605357468128204,
359
+ "learning_rate": 4.136843819999117e-05,
360
+ "loss": 0.038,
361
+ "step": 16500
362
+ },
363
+ {
364
+ "epoch": 2.6463011246449,
365
+ "grad_norm": 0.027949590235948563,
366
+ "learning_rate": 3.977561947162954e-05,
367
+ "loss": 0.0376,
368
+ "step": 17000
369
+ },
370
+ {
371
+ "epoch": 2.724131221543371,
372
+ "grad_norm": 0.026584528386592865,
373
+ "learning_rate": 3.80846956772673e-05,
374
+ "loss": 0.0372,
375
+ "step": 17500
376
+ },
377
+ {
378
+ "epoch": 2.749970813713663,
379
+ "eval_avg": 0.706001258948505,
380
+ "eval_cer": 0.6536609451579365,
381
+ "eval_der": 0.7939834810607371,
382
+ "eval_loss": 0.030004331842064857,
383
+ "eval_runtime": 304.4012,
384
+ "eval_samples_per_second": 445.869,
385
+ "eval_steps_per_second": 1.744,
386
+ "eval_wer": 0.6703593506268415,
387
+ "step": 17666
388
  }
389
  ],
390
  "logging_steps": 500,
 
404
  "attributes": {}
405
  }
406
  },
407
+ "total_flos": 1.3788271574227354e+18,
408
  "train_batch_size": 256,
409
  "trial_name": null,
410
  "trial_params": null