guyhadad01 committed on
Commit
58860b4
·
verified ·
1 Parent(s): d76964e

Training in progress, step 26000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1543,6 +1543,10 @@ You can finetune this model on your own dataset.
1543
  | 0.4541 | 25700 | 0.2669 |
1544
  | 0.4550 | 25750 | 0.3316 |
1545
  | 0.4559 | 25800 | 0.3395 |
 
 
 
 
1546
 
1547
  </details>
1548
 
 
1543
  | 0.4541 | 25700 | 0.2669 |
1544
  | 0.4550 | 25750 | 0.3316 |
1545
  | 0.4559 | 25800 | 0.3395 |
1546
+ | 0.4568 | 25850 | 0.3631 |
1547
+ | 0.4577 | 25900 | 0.3418 |
1548
+ | 0.4586 | 25950 | 0.3351 |
1549
+ | 0.4594 | 26000 | 0.3117 |
1550
 
1551
  </details>
1552
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd62d182588cf8dcdefa578689850921060508dd744c2b3d5b8b216b2f913c93
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d9b275662690960867e4c5004de25c023e37f1f7c4ebe3e55950090be859db5
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c66245bb4fd1461fe3283febbf948bf75039365f0ad45b5077d2a510d710e8d9
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccf58858fe88830e35307ea10b8a5b6180e3bcc733d316d0262f05ad1036e132
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a2d25e27ed0772b40c719933dfce361fb32d9594edb2389a78ead3d7c0f02d3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa2ed85cbcfc26a558906734eea48312aeda57b3baa4220e882e04b5dde95173
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ed2d3227321b546366709c7d41896c93e3aed6b33762555946b5ad3ddd21662
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5a1824f2390986b90c617282d9a88df5bdc60e3f12c5d84551697fb36352fa3
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2352e4a13b9010953b7c8382f227a4c5da82a9b4a73a8c91fe1b7aa1258dd370
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67c6214bd46d06bb31b87e2550447bf08cbff7452cc6c1e25562bc8a18251786
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.45590288208372354,
6
  "eval_steps": 500,
7
- "global_step": 25800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3620,6 +3620,34 @@
3620
  "learning_rate": 3.0236987296538455e-05,
3621
  "loss": 0.3395,
3622
  "step": 25800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3623
  }
3624
  ],
3625
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.45943701295258965,
6
  "eval_steps": 500,
7
+ "global_step": 26000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3620
  "learning_rate": 3.0236987296538455e-05,
3621
  "loss": 0.3395,
3622
  "step": 25800
3623
+ },
3624
+ {
3625
+ "epoch": 0.45678641480094007,
3626
+ "grad_norm": 2.8250796794891357,
3627
+ "learning_rate": 3.018790127819992e-05,
3628
+ "loss": 0.3631,
3629
+ "step": 25850
3630
+ },
3631
+ {
3632
+ "epoch": 0.4576699475181566,
3633
+ "grad_norm": 1.1532173156738281,
3634
+ "learning_rate": 3.013881525986138e-05,
3635
+ "loss": 0.3418,
3636
+ "step": 25900
3637
+ },
3638
+ {
3639
+ "epoch": 0.4585534802353731,
3640
+ "grad_norm": 1.687465786933899,
3641
+ "learning_rate": 3.0089729241522846e-05,
3642
+ "loss": 0.3351,
3643
+ "step": 25950
3644
+ },
3645
+ {
3646
+ "epoch": 0.45943701295258965,
3647
+ "grad_norm": 4.05789852142334,
3648
+ "learning_rate": 3.004064322318431e-05,
3649
+ "loss": 0.3117,
3650
+ "step": 26000
3651
  }
3652
  ],
3653
  "logging_steps": 50,