guyhadad01 commited on
Commit
69121a2
·
verified ·
1 Parent(s): a17b679

Training in progress, step 25800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1539,6 +1539,10 @@ You can finetune this model on your own dataset.
1539
  | 0.4506 | 25500 | 0.3245 |
1540
  | 0.4515 | 25550 | 0.2978 |
1541
  | 0.4524 | 25600 | 0.3397 |
 
 
 
 
1542
 
1543
  </details>
1544
 
 
1539
  | 0.4506 | 25500 | 0.3245 |
1540
  | 0.4515 | 25550 | 0.2978 |
1541
  | 0.4524 | 25600 | 0.3397 |
1542
+ | 0.4533 | 25650 | 0.4655 |
1543
+ | 0.4541 | 25700 | 0.2669 |
1544
+ | 0.4550 | 25750 | 0.3316 |
1545
+ | 0.4559 | 25800 | 0.3395 |
1546
 
1547
  </details>
1548
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b4c41f05edc2d7e0e5b6aa96c7280a269723970b3d9f5db97a908d698c18e46
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd62d182588cf8dcdefa578689850921060508dd744c2b3d5b8b216b2f913c93
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ad0f634d22e8d985415b64b93836e5380971e245fef96c6b35c06a87043b680
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c66245bb4fd1461fe3283febbf948bf75039365f0ad45b5077d2a510d710e8d9
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d3d11ea4dc06732960ed6abb1d44f0f58d98e38680260f859b6e949eb007dff1
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a2d25e27ed0772b40c719933dfce361fb32d9594edb2389a78ead3d7c0f02d3
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42f87f293944d5e456973842209f35aaec89127a12621bc86fb62b420000afe5
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ed2d3227321b546366709c7d41896c93e3aed6b33762555946b5ad3ddd21662
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0157ec5a2cd87b323072c019eeb626da0770a47c34b4436db6020558b163b6ea
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2352e4a13b9010953b7c8382f227a4c5da82a9b4a73a8c91fe1b7aa1258dd370
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.4523687512148575,
6
  "eval_steps": 500,
7
- "global_step": 25600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3592,6 +3592,34 @@
3592
  "learning_rate": 3.0433331369892604e-05,
3593
  "loss": 0.3397,
3594
  "step": 25600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3595
  }
3596
  ],
3597
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.45590288208372354,
6
  "eval_steps": 500,
7
+ "global_step": 25800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3592
  "learning_rate": 3.0433331369892604e-05,
3593
  "loss": 0.3397,
3594
  "step": 25600
3595
+ },
3596
+ {
3597
+ "epoch": 0.453252283932074,
3598
+ "grad_norm": 3.319705009460449,
3599
+ "learning_rate": 3.0384245351554065e-05,
3600
+ "loss": 0.4655,
3601
+ "step": 25650
3602
+ },
3603
+ {
3604
+ "epoch": 0.45413581664929054,
3605
+ "grad_norm": 1.3729950189590454,
3606
+ "learning_rate": 3.033515933321553e-05,
3607
+ "loss": 0.2669,
3608
+ "step": 25700
3609
+ },
3610
+ {
3611
+ "epoch": 0.45501934936650706,
3612
+ "grad_norm": 1.3527820110321045,
3613
+ "learning_rate": 3.028607331487699e-05,
3614
+ "loss": 0.3316,
3615
+ "step": 25750
3616
+ },
3617
+ {
3618
+ "epoch": 0.45590288208372354,
3619
+ "grad_norm": 1.4500503540039062,
3620
+ "learning_rate": 3.0236987296538455e-05,
3621
+ "loss": 0.3395,
3622
+ "step": 25800
3623
  }
3624
  ],
3625
  "logging_steps": 50,